diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
index a57773ac6c..7a4e6b6a78 100644
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -12,12 +12,12 @@ jobs:
       matrix:
         os: [ubuntu-latest, windows-latest, macOS-latest]
         # choosing to run a reduced set of LTS, current, and next, to balance coverage and execution time
-        java: [8, 17, 20]
+        java: [8, 17, 21]
       fail-fast: false
     name: Test JDK ${{ matrix.java }}, ${{ matrix.os }}
     steps:
       - name: Checkout
-        uses: actions/checkout@v3
+        uses: actions/checkout@v4
 
       - name: Set up JDK ${{ matrix.java }}
         uses: actions/setup-java@v3
diff --git a/.github/workflows/cifuzz.yml b/.github/workflows/cifuzz.yml
index 3d265ab557..23df68aa2c 100644
--- a/.github/workflows/cifuzz.yml
+++ b/.github/workflows/cifuzz.yml
@@ -19,7 +19,7 @@ jobs:
         dry-run: false
         language: jvm
     - name: Upload Crash
-      uses: actions/upload-artifact@v1
+      uses: actions/upload-artifact@v3
       if: failure() && steps.build.outcome == 'success'
       with:
         name: artifacts
diff --git a/.github/workflows/codeql.yml b/.github/workflows/codeql.yml
index 7eaa5be624..0eea129b29 100644
--- a/.github/workflows/codeql.yml
+++ b/.github/workflows/codeql.yml
@@ -14,7 +14,7 @@ jobs:
     name: "CodeQL"
     steps:
       - name: Checkout
-        uses: actions/checkout@v3
+        uses: actions/checkout@v4
       - name: Set up JDK
         uses: actions/setup-java@v3
         with:
diff --git a/CHANGES b/CHANGES
index 9f05522ca6..4eaed85ac6 100644
--- a/CHANGES
+++ b/CHANGES
@@ -1,6 +1,84 @@
 jsoup changelog
 
-Release 1.16.2 [PENDING]
+Release 1.17.1 [PENDING]
+  * Improvement: in Jsoup.connect(), added support for request-level authentication, supporting authentication to
+    proxies and to servers.
+    <https://github.com/jhy/jsoup/pull/2046>
+
+  * Improvement: in the Elements list, added direct support for `#set(index, element)`, `#remove(index)`,
+    `#remove(object)`, `#clear()`, `#removeAll(collection)`, `#retainAll(collection)`, `#removeIf(filter)`,
+    `#replaceAll(operator)`. These methods update the original DOM, as well as the Elements list.
+    <https://github.com/jhy/jsoup/pull/2017>
+
+  * Improvement: added the NodeIterator class, to efficiently traverse a node tree using the Iterator interface. And
+    added Stream Element#stream() and Node#nodeStream() methods, to enable fluent composable stream pipelines of node
+    traversals.
+    <https://github.com/jhy/jsoup/pull/2051>
+
+  * Improvement: when changing the OutputSettings syntax to XML, the xhtml EscapeMode is automatically set by default.
+
+  * Improvement: added the `:is(selector list)` pseudo-selector, which finds elements that match any of the selectors in
+    the selector list. Useful for making large ORed selectors more readable.
+
+  * Improvement: repackaged the library with native (vs automatic) JPMS module support.
+    <https://github.com/jhy/jsoup/pull/2025>
+
+  * Improvement: better fidelity of source positions when tracking is enabled. And implicitly created or closed elements
+    are tracked and detectable via Range.isImplicit().
+    <https://github.com/jhy/jsoup/pull/2056>
+
+  * Improvement: when source tracking is enabled, the source position for attribute names and values is now available.
+    Attribute#sourceRange() provides the ranges.
+    <https://github.com/jhy/jsoup/pull/2057>
+
+  * Improvement: when running concurrently under Java 21+ Virtual Threads, virtual threads could be pinned to their
+    carrier platform thread when parsing an input stream. To improve performance, particularly when parsing fetched
+    URLs, the internal ConstrainableInputStream has been replaced by ControllableInputStream, which avoids the locking
+    which caused that pinning.
+    <https://github.com/jhy/jsoup/issues/2054>
+
+  * Improvement: in Jsoup.Connect, allow any XML mimetype as a supported mimetype. Was previously limited to
+    `{application|text}/xml`. This enables e.g. fetching SVGs with an image/svg+xml mimetype, without having to
+    disable mimetype validation.
+    <https://github.com/jhy/jsoup/issues/2059>
+
+  * Bugfix: when outputting with XML syntax, HTML elements that were parsed as data nodes (<script> and <style>) should
+    be emitted as CDATA nodes, so that they can be parsed correctly by an XML parser.
+    <https://github.com/jhy/jsoup/pull/1720>
+
+  * Bugfix: the Immediate Parent selector `>` could match elements above the root context element, causing incorrect
+    elements to be returned when used on elements other than the root document.
+    <https://github.com/jhy/jsoup/issues/2018>
+
+  * Bugfix: in a sub-query such as `p:has(> span, > i)`, combinators following the `,` Or combinator would be
+    incorrectly skipped, such that the sub-query was parsed as `i` instead of `> i`.
+    <https://github.com/jhy/jsoup/issues/1707>
+
+  * Bugfix: in W3CDom, if the jsoup input document contained an empty doctype, the conversion would fail with a
+    DOMException. Now, said doctype is discarded, and the conversion continues.
+
+  * Bugfix: when cleaning a document containing SVG elements (or other foreign elements that have preserved case names),
+    the cleaned output would be incorrectly nested if the safelist had a different case than the input document.
+    <https://github.com/jhy/jsoup/issues/2049>
+
+  * Bugfix: when cleaning a document, the output style of unknown self-closing tags from the input was not preserved in
+    the output. (So a <foo /> in the input, if safe-listed, would be output as <foo></foo>.)
+    <https://github.com/jhy/jsoup/issues/2049>
+
+  * Build Improvement: added a local test proxy implementation, for proxy integration tests.
+    <https://github.com/jhy/jsoup/pull/2029>
+
+  * Build Improvement: added tests for HTTPS request support, using a local self-signed cert. Includes proxy tests.
+    <https://github.com/jhy/jsoup/pull/2032>
+
+  * Change: the InputStream returned in Connection.Response.bodyStream() is no longer a ConstrainableInputStream,
+    and so is not subject to settings such as timeout or maximum size. It is now a plain BufferedInputStream around the
+    response stream. Whilst this behaviour was not documented, you may have been inadvertently relying on those
+    constraints. The constraints are still applied to other methods such as .parse() and .bufferUp(). So if you do want
+    a constrained BufferedInputStream, you may do Connection.Response.bufferUp().bodyStream().
+    <https://github.com/jhy/jsoup/issues/2054>
+
+Release 1.16.2 [20-Oct-2023]
   * Improvement: optimized the performance of complex CSS selectors, by adding a cost-based query planner. Evaluators
     are sorted by their relative execution cost, and executed in order of lower to higher cost. This speeds the
     matching process by ensuring that simpler evaluations (such as a tag name match) are conducted prior to more
diff --git a/README.md b/README.md
index 96033b8272..99f5e48c3b 100644
--- a/README.md
+++ b/README.md
@@ -1,8 +1,8 @@
 # jsoup: Java HTML Parser
 
-**jsoup** is a Java library for working with real-world HTML. It provides a very convenient API for fetching URLs and extracting and manipulating data, using the best of HTML5 DOM methods and CSS selectors.
+**jsoup** is a Java library that simplifies working with real-world HTML and XML. It offers an easy-to-use API for URL fetching, data parsing, extraction, and manipulation using DOM API methods, CSS, and xpath selectors.
 
-**jsoup** implements the [WHATWG HTML5](https://html.spec.whatwg.org/multipage/) specification, and parses HTML to the same DOM as modern browsers do.
+**jsoup** implements the [WHATWG HTML5](https://html.spec.whatwg.org/multipage/) specification, and parses HTML to the same DOM as modern browsers.
 
 * scrape and [parse](https://jsoup.org/cookbook/input/parse-document-from-string) HTML from a URL, file, or string
 * find and [extract data](https://jsoup.org/cookbook/extracting-data/selector-syntax), using DOM traversal or CSS selectors
diff --git a/pom.xml b/pom.xml
index fbb8369ea1..6dbab97841 100644
--- a/pom.xml
+++ b/pom.xml
@@ -5,9 +5,9 @@
 
   <groupId>org.jsoup</groupId>
   <artifactId>jsoup</artifactId>
-  <version>1.16.2</version><!-- remember to update previous version below for japicmp -->
-  <description>jsoup is a Java library for working with real-world HTML. It provides a very convenient API for fetching URLs and extracting and manipulating data, using the best of HTML5 DOM methods and CSS selectors. jsoup implements the WHATWG HTML5 specification, and parses HTML to the same DOM as modern browsers do.</description>
+  <version>1.17.1</version><!-- remember to update previous version below for japicmp -->
   <url>https://jsoup.org/</url>
+  <description>jsoup is a Java library that simplifies working with real-world HTML and XML. It offers an easy-to-use API for URL fetching, data parsing, extraction, and manipulation using DOM API methods, CSS, and xpath selectors. jsoup implements the WHATWG HTML5 specification, and parses HTML to the same DOM as modern browsers.</description>
   <inceptionYear>2009</inceptionYear>
   <issueManagement>
     <system>GitHub</system>
@@ -24,7 +24,7 @@
     <url>https://github.com/jhy/jsoup</url>
     <connection>scm:git:https://github.com/jhy/jsoup.git</connection>
     <!-- <developerConnection>scm:git:git@github.com:jhy/jsoup.git</developerConnection> -->
-    <tag>jsoup-1.16.2</tag>
+    <tag>jsoup-1.17.1</tag>
   </scm>
   <organization>
     <name>Jonathan Hedley</name>
@@ -38,13 +38,12 @@
 
   <build>
     <plugins>
+      <!-- Compile -->
       <plugin>
         <groupId>org.apache.maven.plugins</groupId>
         <artifactId>maven-compiler-plugin</artifactId>
         <version>3.11.0</version>
         <configuration>
-          <source>1.8</source>
-          <target>1.8</target>
           <encoding>UTF-8</encoding>
           <compilerArgs>
             <!-- saves output for package-info.java, so mvn sees it has completed it, so incremental compile works -->
@@ -53,9 +52,20 @@
           <!-- this means incremental = true... -->
           <useIncrementalCompilation>false</useIncrementalCompilation>
         </configuration>
+        <executions>
+          <execution>
+            <id>compile-java-8</id>
+            <configuration>
+              <source>1.8</source>
+              <target>1.8</target>
+            </configuration>
+          </execution>
+          <!-- There is a JDK 9+ profile execution below, which adds multi-release=true and compiles module-info -->
+        </executions>
       </plugin>
+
+      <!-- Ensure Java 8 and Android 10 API compatibility -->
       <plugin>
-        <!-- Ensure Java 8 and Android 10 API compatibility -->
         <groupId>org.codehaus.mojo</groupId>
         <artifactId>animal-sniffer-maven-plugin</artifactId>
         <version>1.23</version>
@@ -82,6 +92,17 @@
                 <ignore>java.util.function.Supplier</ignore>
                 <ignore>java.lang.ThreadLocal</ignore>
                 <ignore>java.io.UncheckedIOException</ignore>
+                <ignore>java.util.function.Predicate</ignore>
+                <ignore>java.util.function.UnaryOperator</ignore>
+                <ignore>java.util.stream.Stream</ignore>
+                <ignore>java.util.stream.StreamSupport</ignore>
+                <ignore>java.util.Spliterator</ignore>
+                <ignore>java.util.Spliterators</ignore>
+                <ignore>java.util.Optional</ignore>
+                <ignore>java.util.stream.Collector</ignore>
+                <ignore>java.util.stream.Collectors</ignore>
+
+                <ignore>java.net.HttpURLConnection</ignore><!-- .setAuthenticator(java.net.Authenticator) in Java 9; only used in multirelease 9+ version -->
               </ignores>
               <!-- ^ Provided by https://developer.android.com/studio/write/java8-support#library-desugaring
                Possibly OK to remove androidscents; keep for now to validate other additions are supported. -->
@@ -92,15 +113,15 @@
       <plugin>
         <groupId>org.apache.maven.plugins</groupId>
         <artifactId>maven-javadoc-plugin</artifactId>
-        <version>3.6.0</version>
+        <version>3.6.2</version>
         <configuration>
-            <doclint>none</doclint>
-            <source>8</source>
+          <doclint>none</doclint>
+          <source>8</source>
+          <linksource>true</linksource>
         </configuration>
         <executions>
           <execution>
             <id>attach-javadoc</id>
-            <phase>verify</phase>
             <goals>
               <goal>jar</goal>
             </goals>
@@ -119,9 +140,8 @@
         <executions>
           <execution>
             <id>attach-sources</id>
-            <phase>verify</phase>
             <goals>
-              <goal>jar</goal>
+              <goal>jar-no-fork</goal>
             </goals>
           </execution>
         </executions>
@@ -136,7 +156,7 @@
               <addDefaultImplementationEntries>true</addDefaultImplementationEntries>
             </manifest>
             <manifestEntries>
-              <Automatic-Module-Name>org.jsoup</Automatic-Module-Name>
+              <Multi-Release>true</Multi-Release>
             </manifestEntries>
             <manifestFile>${project.build.outputDirectory}/META-INF/MANIFEST.MF</manifestFile>
           </archive>
@@ -162,7 +182,7 @@
           <instructions>
             <Bundle-DocURL>https://jsoup.org/</Bundle-DocURL>
             <Export-Package>org.jsoup.*</Export-Package>
-            <Import-Package>javax.annotation;version=!;resolution:=optional,javax.annotation.meta;version=!;resolution:=optional,*</Import-Package>
+            <Import-Package>org.jspecify.annotations;version=!;resolution:=optional,*</Import-Package>
           </instructions>
         </configuration>
       </plugin>
@@ -178,7 +198,7 @@
       <plugin>
         <groupId>org.apache.maven.plugins</groupId>
         <artifactId>maven-surefire-plugin</artifactId>
-        <version>3.1.2</version>
+        <version>3.2.2</version>
         <configuration>
           <!-- smaller stack to find stack overflows -->
           <argLine>-Xss256k</argLine>
@@ -186,7 +206,7 @@
       </plugin>
       <plugin>
         <artifactId>maven-failsafe-plugin</artifactId>
-        <version>3.1.2</version>
+        <version>3.2.2</version>
         <executions>
           <execution>
             <goals>
@@ -204,14 +224,14 @@
         <!-- API version compat check - https://siom79.github.io/japicmp/ -->
         <groupId>com.github.siom79.japicmp</groupId>
         <artifactId>japicmp-maven-plugin</artifactId>
-        <version>0.18.1</version>
+        <version>0.18.3</version>
         <configuration>
           <!-- hard code previous version; can't detect when running stateless on build server -->
           <oldVersion>
             <dependency>
               <groupId>org.jsoup</groupId>
               <artifactId>jsoup</artifactId>
-              <version>1.16.1</version>
+              <version>1.16.2</version>
               <type>jar</type>
             </dependency>
           </oldVersion>
@@ -221,7 +241,7 @@
             <breakBuildOnBinaryIncompatibleModifications>true</breakBuildOnBinaryIncompatibleModifications>
             <breakBuildOnSourceIncompatibleModifications>true</breakBuildOnSourceIncompatibleModifications>
             <excludes>
-              <exclude>@java.lang.Deprecated</exclude>
+              <!-- <exclude>@java.lang.Deprecated</exclude> -->
             </excludes>
             <overrideCompatibilityChangeParameters>
               <!-- allows new default and move to default methods. compatible as long as existing binaries aren't making calls via reflection. if so, they need to catch errors anyway. -->
@@ -235,6 +255,18 @@
                 <binaryCompatible>true</binaryCompatible>
                 <sourceCompatible>true</sourceCompatible>
               </overrideCompatibilityChangeParameter>
+
+              <!--
+                One off, getting a spurious ping on adding [<T extends Node> Stream<T> nodeStream(Class<T> class)] to Node.
+                Manually verified binary & source compatibility
+                todo: remove after 1.17.1 release
+               -->
+              <overrideCompatibilityChangeParameter>
+                <compatibilityChange>CLASS_GENERIC_TEMPLATE_CHANGED</compatibilityChange>
+                <binaryCompatible>true</binaryCompatible>
+                <sourceCompatible>true</sourceCompatible>
+              </overrideCompatibilityChangeParameter>
+
             </overrideCompatibilityChangeParameters>
           </parameter>
         </configuration>
@@ -276,6 +308,44 @@
   </distributionManagement>
 
   <profiles>
+    <!-- Compiles the multi-release jar when executed on JDK9+ -->
+    <profile>
+      <id>compile-multi-release</id>
+      <activation>
+        <jdk>[9,2000)</jdk>
+      </activation>
+      <build>
+        <plugins>
+          <plugin>
+            <groupId>org.apache.maven.plugins</groupId>
+            <artifactId>maven-compiler-plugin</artifactId>
+            <executions>
+              <execution>
+                <id>compile-java-8</id>
+                <configuration>
+                  <release>8</release>
+                </configuration>
+              </execution>
+              <execution>
+                <id>compile-java-9</id>
+                <phase>compile</phase>
+                <goals>
+                  <goal>compile</goal>
+                </goals>
+                <configuration>
+                  <release>9</release>
+                  <compileSourceRoots>
+                    <compileSourceRoot>${project.basedir}/src/main/java9</compileSourceRoot>
+                  </compileSourceRoots>
+                  <multiReleaseOutput>true</multiReleaseOutput>
+                </configuration>
+              </execution>
+            </executions>
+          </plugin>
+        </plugins>
+      </build>
+    </profile>
+
     <profile>
       <id>release-sign-artifacts</id>
       <activation>
@@ -292,7 +362,7 @@
             <executions>
               <execution>
                 <id>sign-artifacts</id>
-                <phase>verify</phase>
+                <phase>package</phase>
                 <goals>
                   <goal>sign</goal>
                 </goals>
@@ -308,7 +378,7 @@
         <plugins>
           <plugin>
             <artifactId>maven-failsafe-plugin</artifactId>
-            <version>3.1.2</version>
+            <version>3.2.2</version>
             <executions>
               <execution>
                 <goals>
@@ -329,7 +399,7 @@
     <dependency>
       <groupId>org.junit.jupiter</groupId>
       <artifactId>junit-jupiter</artifactId>
-      <version>5.10.0</version>
+      <version>5.10.1</version>
       <scope>test</scope>
     </dependency>
 
@@ -358,10 +428,18 @@
     </dependency>
 
     <dependency>
-      <!-- javax.annotations.nonnull, with Apache 2 (not GPL) license. Build time only. -->
-      <groupId>com.google.code.findbugs</groupId>
-      <artifactId>jsr305</artifactId>
-      <version>3.0.2</version>
+      <!-- jetty proxy, for integration tests -->
+      <groupId>org.eclipse.jetty</groupId>
+      <artifactId>jetty-proxy</artifactId>
+      <version>${jetty.version}</version>
+      <scope>test</scope>
+    </dependency>
+
+    <dependency>
+      <!-- org.jspecify.annotations.nonnull, with Apache 2 license. Build time only. -->
+      <groupId>org.jspecify</groupId>
+      <artifactId>jspecify</artifactId>
+      <version>0.3.0</version>
       <scope>provided</scope>
     </dependency>
   </dependencies>
diff --git a/src/main/java/org/jsoup/Connection.java b/src/main/java/org/jsoup/Connection.java
index f422debcb7..84b6fb8421 100644
--- a/src/main/java/org/jsoup/Connection.java
+++ b/src/main/java/org/jsoup/Connection.java
@@ -1,14 +1,16 @@
 package org.jsoup;
 
+import org.jsoup.helper.RequestAuthenticator;
 import org.jsoup.nodes.Document;
 import org.jsoup.parser.Parser;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
 import javax.net.ssl.SSLSocketFactory;
 import java.io.BufferedInputStream;
 import java.io.IOException;
 import java.io.InputStream;
 import java.io.UncheckedIOException;
+import java.net.Authenticator;
 import java.net.CookieStore;
 import java.net.Proxy;
 import java.net.URL;
@@ -28,14 +30,14 @@
  cookie store. The cookie store for the session is available via {@link #cookieStore()}. You may provide your own
  implementation via {@link #cookieStore(java.net.CookieStore)} before making requests.</p>
  <p>Request configuration can be made using either the shortcut methods in Connection (e.g. {@link #userAgent(String)}),
- or by methods in the Connection.Request object directly. All request configuration must be made before the request is
+ or by methods in the {@link Connection.Request} object directly. All request configuration must be made before the request is
  executed. When used as an ongoing session, initialize all defaults prior to making multi-threaded {@link
 #newRequest()}s.</p>
  <p>Note that the term "Connection" used here does not mean that a long-lived connection is held against a server for
  the lifetime of the Connection object. A socket connection is only made at the point of request execution ({@link
 #execute()}, {@link #get()}, or {@link #post()}), and the server's response consumed.</p>
  <p>For multi-threaded implementations, it is important to use a {@link #newRequest()} for each request. The session may
- be shared across threads but a given request, not.</p>
+ be shared across concurrent threads, but not a specific request.</p>
  */
 @SuppressWarnings("unused")
 public interface Connection {
@@ -62,12 +64,35 @@ public final boolean hasBody() {
     }
 
     /**
-     Creates a new request, using this Connection as the session-state and to initialize the connection settings (which may then be independently on the returned Connection.Request object).
+     Creates a new request, using this Connection as the session-state and to initialize the connection settings (which
+     may then be independently changed on the returned {@link Connection.Request} object).
      @return a new Connection object, with a shared Cookie Store and initialized settings from this Connection and Request
      @since 1.14.1
      */
     Connection newRequest();
 
+    /**
+     Creates a new request for the supplied URL, using this Connection as the session-state and to initialize the
+     connection settings (which may then be independently changed on the returned {@link Connection.Request} object).
+     <p>Convenience for {@code newRequest().url(url)}.</p>
+     @param url URL for the new request
+     @return a new Connection object, with a shared Cookie Store and initialized settings from this Connection and Request
+     @since 1.17.1
+     */
+    default Connection newRequest(String url) {
+        return newRequest().url(url);
+    }
+
+    /**
+     Creates a new request for the supplied URL, using this Connection as the session-state and to initialize the
+     connection settings (which may then be independently changed on the returned {@link Connection.Request} object).
+     <p>Convenience for {@code newRequest().url(url)}.</p>
+     @param url URL for the new request
+     @return a new Connection object, with a shared Cookie Store and initialized settings from this Connection and Request
+     @since 1.17.1
+     */
+    default Connection newRequest(URL url) {
+        return newRequest().url(url);
+    }
+
     /**
      * Set the request URL to fetch. The protocol must be HTTP or HTTPS.
      * @param url URL to connect to
@@ -135,7 +160,7 @@ public final boolean hasBody() {
     Connection referrer(String referrer);
 
     /**
-     * Configures the connection to (not) follow server redirects. By default this is <b>true</b>.
+     * Configures the connection to (not) follow server redirects. By default, this is <b>true</b>.
      * @param followRedirects true if server redirects should be followed.
      * @return this Connection, for chaining
      */
@@ -149,8 +174,8 @@ public final boolean hasBody() {
     Connection method(Method method);
 
     /**
-     * Configures the connection to not throw exceptions when a HTTP error occurs. (4xx - 5xx, e.g. 404 or 500). By
-     * default this is <b>false</b>; an IOException is thrown if an error is encountered. If set to <b>true</b>, the
+     * Configures the connection to not throw exceptions when an HTTP error occurs. (4xx - 5xx, e.g. 404 or 500). By
+     * default, this is <b>false</b>; an IOException is thrown if an error is encountered. If set to <b>true</b>, the
      * response is populated with the error body, and the status message will reflect the error.
      * @param ignoreHttpErrors - false (default) if HTTP errors should be ignored.
      * @return this Connection, for chaining
@@ -158,7 +183,7 @@ public final boolean hasBody() {
     Connection ignoreHttpErrors(boolean ignoreHttpErrors);
 
     /**
-     * Ignore the document's Content-Type when parsing the response. By default this is <b>false</b>, an unrecognised
+     * Ignore the document's Content-Type when parsing the response. By default, this is <b>false</b>, an unrecognised
      * content-type will cause an IOException to be thrown. (This is to prevent producing garbage by attempting to parse
      * a JPEG binary image, for example.) Set to true to force a parse attempt regardless of content type.
      * @param ignoreContentType set to true if you would like the content type ignored on parsing the response into a
@@ -186,13 +211,14 @@ public final boolean hasBody() {
     /**
      * Add an input stream as a request data parameter. For GETs, has no effect, but for POSTS this will upload the
      * input stream.
+     * <p>Use the {@link #data(String, String, InputStream, String)} method to set the uploaded file's mimetype.</p>
      * @param key data key (form item name)
      * @param filename the name of the file to present to the remove server. Typically just the name, not path,
      * component.
      * @param inputStream the input stream to upload, that you probably obtained from a {@link java.io.FileInputStream}.
      * You must close the InputStream in a {@code finally} block.
-     * @return this Connections, for chaining
-     * @see #data(String, String, InputStream, String) if you want to set the uploaded file's mimetype.
+     * @return this Connection, for chaining
+     * @see #data(String, String, InputStream, String)
      */
     Connection data(String key, String filename, InputStream inputStream);
 
@@ -205,7 +231,7 @@ public final boolean hasBody() {
      * @param inputStream the input stream to upload, that you probably obtained from a {@link java.io.FileInputStream}.
      * @param contentType the Content Type (aka mimetype) to specify for this file.
      * You must close the InputStream in a {@code finally} block.
-     * @return this Connections, for chaining
+     * @return this Connection, for chaining
      */
     Connection data(String key, String filename, InputStream inputStream, String contentType);
 
@@ -224,12 +250,13 @@ public final boolean hasBody() {
     Connection data(Map<String, String> data);
 
     /**
-     Add one or more request {@code key, val} data parameter pairs.<p>Multiple parameters may be set at once, e.g.:
+     Add one or more request {@code key, val} data parameter pairs.
+     <p>Multiple parameters may be set at once, e.g.:
      <code>.data("name", "jsoup", "language", "Java", "language", "English");</code> creates a query string like:
      <code>{@literal ?name=jsoup&language=Java&language=English}</code></p>
      <p>For GET requests, data parameters will be sent on the request query string. For POST (and other methods that
-     contain a body), they will be sent as body form parameters, unless the body is explicitly set by {@link
-    #requestBody(String)}, in which case they will be query string parameters.</p>
+     contain a body), they will be sent as body form parameters, unless the body is explicitly set by
+     {@link #requestBody(String)}, in which case they will be query string parameters.</p>
 
      @param keyvals a set of key value pairs.
      @return this Connection, for chaining
@@ -244,8 +271,8 @@ <p>For GET requests, data parameters will be sent on the request query string. F
     @Nullable KeyVal data(String key);
 
     /**
-     * Set a POST (or PUT) request body. Useful when a server expects a plain request body, not a set for URL
-     * encoded form key/value pairs. E.g.:
+     * Set a POST (or PUT) request body. Useful when a server expects a plain request body (such as JSON), and not a set
+     * of URL encoded form key/value pairs. E.g.:
      * <code><pre>Jsoup.connect(url)
      * .requestBody(json)
      * .header("Content-Type", "application/json")
@@ -256,16 +283,18 @@ <p>For GET requests, data parameters will be sent on the request query string. F
     Connection requestBody(String body);
 
     /**
-     * Set a request header.
+     * Set a request header. Replaces any existing header with the same case-insensitive name.
      * @param name header name
      * @param value header value
      * @return this Connection, for chaining
+     * @see org.jsoup.Connection.Request#header(String, String)
      * @see org.jsoup.Connection.Request#headers()
      */
     Connection header(String name, String value);
 
     /**
-     * Adds each of the supplied headers to the request.
+     * Sets each of the supplied headers on the request. Existing headers with the same case-insensitive name will be
+     * replaced with the new value.
      * @param headers map of headers name {@literal ->} value pairs
      * @return this Connection, for chaining
      * @see org.jsoup.Connection.Request#headers()
@@ -303,24 +332,83 @@ <p>For GET requests, data parameters will be sent on the request query string. F
     CookieStore cookieStore();
 
     /**
-     * Provide an alternate parser to use when parsing the response to a Document. If not set, defaults to the HTML
-     * parser, unless the response content-type is XML, in which case the XML parser is used.
+     * Provide a specific parser to use when parsing the response to a Document. If not set, jsoup defaults to the
+     * {@link Parser#htmlParser() HTML parser}, unless the response content-type is XML, in which case the
+     * {@link Parser#xmlParser() XML parser} is used.
      * @param parser alternate parser
      * @return this Connection, for chaining
      */
     Connection parser(Parser parser);
 
     /**
-     * Sets the default post data character set for x-www-form-urlencoded post data
+     * Set the character-set used to encode for x-www-form-urlencoded post data. Defaults to {@code UTF-8}.
      * @param charset character set to encode post data
      * @return this Connection, for chaining
      */
     Connection postDataCharset(String charset);
 
+    /**
+     Set the authenticator to use for this connection, enabling requests to URLs, and via proxies, that require
+     authentication credentials.
+     <p>The authentication scheme used is automatically detected during the request execution.
+     Supported schemes (subject to the platform) are {@code basic}, {@code digest}, {@code NTLM},
+     and {@code Kerberos}.</p>
+
+     <p>To use, supply a {@link RequestAuthenticator} function that:
+     <ol>
+     <li>validates the URL that is requesting authentication, and</li>
+     <li>returns the appropriate credentials (username and password)</li>
+     </ol>
+     </p>
+
+     <p>For example, to authenticate both to a proxy and a downstream web server:
+     <code><pre>
+     Connection session = Jsoup.newSession()
+         .proxy("proxy.example.com", 8080)
+         .auth(auth -> {
+             if (auth.isServer()) { // provide credentials for the request url
+                 Validate.isTrue(auth.url().getHost().equals("example.com"));
+                 // check that we're sending credentials where we expect, and not redirected out
+                 return auth.credentials("username", "password");
+             } else { // auth.isProxy()
+                 return auth.credentials("proxy-user", "proxy-password");
+             }
+         });
+
+     Connection.Response response = session.newRequest("https://example.com/adminzone/").execute();
+     </pre></code>
+     </p>
+
+     <p>The system may cache the authentication and use it for subsequent requests to the same resource.</p>
+
+     <p><b>Implementation notes</b></p>
+     <p>For compatibility, on a Java 8 platform, authentication is set up via the system-wide default
+     {@link java.net.Authenticator#setDefault(Authenticator)} method via a ThreadLocal delegator. Whilst the
+     authenticator used is request specific and thread-safe, if you have other calls to {@code setDefault}, they will be
+     incompatible with this implementation.</p>
+     <p>On Java 9 and above, the preceding note does not apply; authenticators are directly set on the request. </p>
+     <p>If you are attempting to authenticate to a proxy that uses the {@code basic} scheme and will be fetching HTTPS
+     URLs, you need to configure your Java platform to enable that, by setting the
+     {@code jdk.http.auth.tunneling.disabledSchemes} system property to {@code ""}.
+     This must be executed prior to any authentication attempts. E.g.:
+     <code><pre>
+     static {
+        System.setProperty("jdk.http.auth.tunneling.disabledSchemes", "");
+        // removes Basic, which is otherwise excluded from auth for CONNECT tunnels
+     }</pre></code>
+     </p>
+     * @param authenticator the authenticator to use in this connection
+     * @return this Connection, for chaining
+     * @since 1.17.1
+     */
+    default Connection auth(@Nullable RequestAuthenticator authenticator) {
+        throw new UnsupportedOperationException();
+    }
+
     /**
      * Execute the request as a GET, and parse the result.
      * @return parsed Document
-     * @throws java.net.MalformedURLException if the request URL is not a HTTP or HTTPS URL, or is otherwise malformed
+     * @throws java.net.MalformedURLException if the request URL is not an HTTP or HTTPS URL, or is otherwise malformed
      * @throws HttpStatusException if the response is not OK and HTTP response errors are not ignored
      * @throws UnsupportedMimeTypeException if the response mime type is not supported and those errors are not ignored
      * @throws java.net.SocketTimeoutException if the connection times out
@@ -341,7 +429,7 @@ <p>For GET requests, data parameters will be sent on the request query string. F
 
     /**
      * Execute the request.
-     * @return a response object
+     * @return the executed {@link Response}
      * @throws java.net.MalformedURLException if the request URL is not a HTTP or HTTPS URL, or is otherwise malformed
      * @throws HttpStatusException if the response is not OK and HTTP response errors are not ignored
      * @throws UnsupportedMimeTypeException if the response mime type is not supported and those errors are not ignored
@@ -650,7 +738,7 @@ interface Request extends Base<Request> {
         Collection<KeyVal> data();
 
         /**
-         * Set a POST (or PUT) request body. Useful when a server expects a plain request body, not a set for URL
+         * Set a POST (or PUT) request body. Useful when a server expects a plain request body, not a set of URL
          * encoded form key/value pairs. E.g.:
          * <code><pre>Jsoup.connect(url)
          * .requestBody(json)
@@ -694,6 +782,27 @@ interface Request extends Base<Request> {
          */
         String postDataCharset();
 
+        /**
+         Set the authenticator to use for this request.
+         See {@link Connection#auth(RequestAuthenticator) Connection.auth(authenticator)} for examples and
+         implementation notes.
+         * @param authenticator the authenticator
+         * @return this Request, for chaining.
+         * @since 1.17.1
+         */
+        default Request auth(@Nullable RequestAuthenticator authenticator)  {
+            throw new UnsupportedOperationException();
+        }
+
+        /**
+         Get the RequestAuthenticator, if any, that will be used on this request.
+         * @return the RequestAuthenticator, or {@code null} if not set
+         * @since 1.17.1
+         */
+        @Nullable
+        default RequestAuthenticator auth() {
+            throw new UnsupportedOperationException();
+        }
     }
 
     /**
@@ -754,18 +863,24 @@ interface Response extends Base<Response> {
 
         /**
          * Read the body of the response into a local buffer, so that {@link #parse()} may be called repeatedly on the
-         * same connection response (otherwise, once the response is read, its InputStream will have been drained and
-         * may not be re-read). Calling {@link #body() } or {@link #bodyAsBytes()} has the same effect.
+         * same connection response. Otherwise, once the response is read, its InputStream will have been drained and
+         * may not be re-read.
+         * <p>Calling {@link #body() } or {@link #bodyAsBytes()} has the same effect.</p>
          * @return this response, for chaining
          * @throws UncheckedIOException if an IO exception occurs during buffering.
          */
         Response bufferUp();
 
         /**
-         * Get the body of the response as a (buffered) InputStream. You should close the input stream when you're done with it.
-         * Other body methods (like bufferUp, body, parse, etc) will not work in conjunction with this method.
-         * <p>This method is useful for writing large responses to disk, without buffering them completely into memory first.</p>
-         * @return the response body input stream
+         Get the body of the response as a (buffered) InputStream. You should close the input stream when you're done
+         with it.
+         <p>Other body methods (like bufferUp, body, parse, etc) will generally not work in conjunction with this method,
+         as it consumes the InputStream.</p>
+         <p>Any configured max size or maximum read timeout applied to the connection will not be applied to this stream,
+         unless {@link #bufferUp()} is called prior.</p>
+         <p>This method is useful for writing large responses to disk, without buffering them completely into memory
+         first.</p>
+         @return the response body input stream
          */
         BufferedInputStream bodyStream();
     }
diff --git a/src/main/java/org/jsoup/Jsoup.java b/src/main/java/org/jsoup/Jsoup.java
index b4a99ebcb1..29acbafbc4 100644
--- a/src/main/java/org/jsoup/Jsoup.java
+++ b/src/main/java/org/jsoup/Jsoup.java
@@ -7,9 +7,7 @@
 import org.jsoup.parser.Parser;
 import org.jsoup.safety.Cleaner;
 import org.jsoup.safety.Safelist;
-
-import javax.annotation.Nullable;
-import javax.annotation.WillClose;
+import org.jspecify.annotations.Nullable;
 
 import java.io.File;
 import java.io.IOException;
@@ -196,7 +194,7 @@ public static Document parse(File file, @Nullable String charsetName, String bas
 
      @throws IOException if the file could not be found, or read, or if the charsetName is invalid.
      */
-    public static Document parse(@WillClose InputStream in, @Nullable String charsetName, String baseUri) throws IOException {
+    public static Document parse(InputStream in, @Nullable String charsetName, String baseUri) throws IOException {
         return DataUtil.load(in, charsetName, baseUri);
     }
 
diff --git a/src/main/java/org/jsoup/helper/AuthenticationHandler.java b/src/main/java/org/jsoup/helper/AuthenticationHandler.java
new file mode 100644
index 0000000000..bd3e6e1ba7
--- /dev/null
+++ b/src/main/java/org/jsoup/helper/AuthenticationHandler.java
@@ -0,0 +1,91 @@
+package org.jsoup.helper;
+
+import org.jspecify.annotations.Nullable;
+
+import java.lang.reflect.Constructor;
+import java.net.Authenticator;
+import java.net.HttpURLConnection;
+import java.net.PasswordAuthentication;
+
+/**
+ Handles per request Authenticator-based authentication. Loads the class {@code org.jsoup.helper.RequestAuthHandler} if
+ per-request Authenticators are supported (Java 9+), or installs a system-wide Authenticator that delegates to a request
+ ThreadLocal.
+ */
+class AuthenticationHandler extends Authenticator {
+    static final int MaxAttempts = 5; // max authentication attempts per request. allows for multiple auths (e.g. proxy and server) in one request, but saves otherwise 20 requests if credentials are incorrect.
+    static AuthShim handler; // the strategy in use; assigned exactly once by the static initializer below
+
+    static {
+        try {
+            //noinspection unchecked
+            Class<AuthShim> perRequestClass = (Class<AuthShim>) Class.forName("org.jsoup.helper.RequestAuthHandler");
+            Constructor<AuthShim> constructor = perRequestClass.getConstructor();
+            handler = constructor.newInstance();
+        } catch (ClassNotFoundException e) { // per-request handler class is not available: fall back to the system-wide delegate
+            handler = new GlobalHandler();
+        } catch (Exception e) { // the class was found but could not be instantiated; fail class initialization loudly
+            throw new IllegalStateException(e);
+        }
+    }
+
+    @Nullable RequestAuthenticator auth; // stays null when created via the no-arg constructor
+    int attemptCount = 0; // credential callbacks seen so far by this handler; compared against MaxAttempts
+
+    AuthenticationHandler() {} // leaves auth unset; GlobalHandler installs such an instance as the default Authenticator
+
+    AuthenticationHandler(RequestAuthenticator auth) {
+        this.auth = auth;
+    }
+
+    /**
+     Authentication callback, called by HttpURLConnection - either as system-wide default (Java 8) or per HttpURLConnection (Java 9+)
+     * @return credentials, or null if not attempting to auth.
+     */
+    @Nullable @Override public final PasswordAuthentication getPasswordAuthentication() {
+        AuthenticationHandler delegate = handler.get(this);
+        if (delegate == null) return null; // this request has no auth handler
+        delegate.attemptCount++;
+        // if the password returned fails, Java will repeatedly retry the request with a new password auth hit (because
+        // it may be an interactive prompt, and the user could eventually get it right). But in Jsoup's context, the
+        // auth will either be correct or not, so just abandon
+        if (delegate.attemptCount > MaxAttempts)
+            return null;
+        if (delegate.auth == null)
+            return null; // detached - would have been the Global Authenticator (not a delegate)
+
+        RequestAuthenticator.Context ctx = new RequestAuthenticator.Context(
+            this.getRequestingURL(), this.getRequestorType(), this.getRequestingPrompt());
+        return delegate.auth.authenticate(ctx);
+    }
+
+    interface AuthShim {
+        void enable(RequestAuthenticator auth, HttpURLConnection con); // register the authenticator for the request being set up
+
+        void remove(); // detach the authenticator once the request has finished
+
+        @Nullable AuthenticationHandler get(AuthenticationHandler helper); // resolve the handler holding the request's authenticator, or null if none
+    }
+
+    /**
+     On Java 8 we install a system-wide Authenticator, which pulls the delegating Auth from a ThreadLocal pool.
+     */
+    static class GlobalHandler implements AuthShim {
+        static ThreadLocal<AuthenticationHandler> authenticators = new ThreadLocal<>(); // one delegate per requesting thread
+        static {
+            Authenticator.setDefault(new AuthenticationHandler()); // runs once, when GlobalHandler is first initialized
+        }
+
+        @Override public void enable(RequestAuthenticator auth, HttpURLConnection con) { // con is unused: the delegate is bound to the calling thread
+            authenticators.set(new AuthenticationHandler(auth));
+        }
+
+        @Override public void remove() {
+            authenticators.remove();
+        }
+
+        @Override public AuthenticationHandler get(AuthenticationHandler helper) { // helper is ignored; lookup is by current thread
+            return authenticators.get();
+        }
+    }
+}
diff --git a/src/main/java/org/jsoup/helper/DataUtil.java b/src/main/java/org/jsoup/helper/DataUtil.java
index 69e1f29893..c1c791053c 100644
--- a/src/main/java/org/jsoup/helper/DataUtil.java
+++ b/src/main/java/org/jsoup/helper/DataUtil.java
@@ -1,7 +1,8 @@
 package org.jsoup.helper;
 
-import org.jsoup.internal.ConstrainableInputStream;
+import org.jsoup.internal.ControllableInputStream;
 import org.jsoup.internal.Normalizer;
+import org.jsoup.internal.SharedConstants;
 import org.jsoup.internal.StringUtil;
 import org.jsoup.nodes.Comment;
 import org.jsoup.nodes.Document;
@@ -10,9 +11,7 @@
 import org.jsoup.nodes.XmlDeclaration;
 import org.jsoup.parser.Parser;
 import org.jsoup.select.Elements;
-
-import javax.annotation.Nullable;
-import javax.annotation.WillClose;
+import org.jspecify.annotations.Nullable;
 
 import java.io.BufferedReader;
 import java.io.CharArrayReader;
@@ -34,6 +33,8 @@
 import java.util.regex.Pattern;
 import java.util.zip.GZIPInputStream;
 
+import static org.jsoup.internal.SharedConstants.DefaultBufferSize;
+
 /**
  * Internal static utilities for handling data.
  *
@@ -44,7 +45,6 @@ public final class DataUtil {
     public static final Charset UTF_8 = Charset.forName("UTF-8"); // Don't use StandardCharsets, as those only appear in Android API 19, and we target 10.
     static final String defaultCharsetName = UTF_8.name(); // used if not found in header or meta charset
     private static final int firstReadBufferSize = 1024 * 5;
-    static final int bufferSize = 1024 * 32;
     private static final char[] mimeBoundaryChars =
             "-_1234567890abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ".toCharArray();
     static final int boundaryLength = 32;
@@ -105,7 +105,7 @@ public static Document load(File file, @Nullable String charsetName, String base
      * @return Document
      * @throws IOException on IO error
      */
-    public static Document load(@WillClose InputStream in, @Nullable String charsetName, String baseUri) throws IOException {
+    public static Document load(InputStream in, @Nullable String charsetName, String baseUri) throws IOException {
         return parseInputStream(in, charsetName, baseUri, Parser.htmlParser());
     }
 
@@ -118,7 +118,7 @@ public static Document load(@WillClose InputStream in, @Nullable String charsetN
      * @return Document
      * @throws IOException on IO error
      */
-    public static Document load(@WillClose InputStream in, @Nullable String charsetName, String baseUri, Parser parser) throws IOException {
+    public static Document load(InputStream in, @Nullable String charsetName, String baseUri, Parser parser) throws IOException {
         return parseInputStream(in, charsetName, baseUri, parser);
     }
 
@@ -129,23 +129,23 @@ public static Document load(@WillClose InputStream in, @Nullable String charsetN
      * @throws IOException on IO error
      */
     static void crossStreams(final InputStream in, final OutputStream out) throws IOException {
-        final byte[] buffer = new byte[bufferSize];
+        final byte[] buffer = new byte[DefaultBufferSize];
         int len;
         while ((len = in.read(buffer)) != -1) {
             out.write(buffer, 0, len);
         }
     }
 
-    static Document parseInputStream(@Nullable @WillClose InputStream input, @Nullable String charsetName, String baseUri, Parser parser) throws IOException  {
+    static Document parseInputStream(@Nullable InputStream input, @Nullable String charsetName, String baseUri, Parser parser) throws IOException  {
         if (input == null) // empty body
             return new Document(baseUri);
-        input = ConstrainableInputStream.wrap(input, bufferSize, 0);
+        input = ControllableInputStream.wrap(input, DefaultBufferSize, 0);
 
         @Nullable Document doc = null;
 
         // read the start of the stream and look for a BOM or meta charset
         try {
-            input.mark(bufferSize);
+            input.mark(DefaultBufferSize);
             ByteBuffer firstBytes = readToByteBuffer(input, firstReadBufferSize - 1); // -1 because we read one more to see if completed. First read is < buffer size, so can't be invalid.
             boolean fullyRead = (input.read() == -1);
             input.reset();
@@ -208,7 +208,7 @@ else if (first instanceof Comment) {
             if (doc == null) {
                 if (charsetName == null)
                     charsetName = defaultCharsetName;
-                BufferedReader reader = new BufferedReader(new InputStreamReader(input, Charset.forName(charsetName)), bufferSize); // Android level does not allow us try-with-resources
+                BufferedReader reader = new BufferedReader(new InputStreamReader(input, Charset.forName(charsetName)), DefaultBufferSize); // Android level does not allow us try-with-resources
                 try {
                     if (bomCharset != null && bomCharset.offset) { // creating the buffered reader ignores the input pos, so must skip here
                         long skipped = reader.skip(1);
@@ -247,9 +247,7 @@ else if (first instanceof Comment) {
      * @throws IOException if an exception occurs whilst reading from the input stream.
      */
     public static ByteBuffer readToByteBuffer(InputStream inStream, int maxSize) throws IOException {
-        Validate.isTrue(maxSize >= 0, "maxSize must be 0 (unlimited) or larger");
-        final ConstrainableInputStream input = ConstrainableInputStream.wrap(inStream, bufferSize, maxSize);
-        return input.readToByteBuffer(maxSize);
+        return ControllableInputStream.readToByteBuffer(inStream, maxSize);
     }
 
     static ByteBuffer emptyByteBuffer() {
diff --git a/src/main/java/org/jsoup/helper/HttpConnection.java b/src/main/java/org/jsoup/helper/HttpConnection.java
index 6bc52e1c7a..fc9467aeba 100644
--- a/src/main/java/org/jsoup/helper/HttpConnection.java
+++ b/src/main/java/org/jsoup/helper/HttpConnection.java
@@ -4,13 +4,14 @@
 import org.jsoup.HttpStatusException;
 import org.jsoup.UncheckedIOException;
 import org.jsoup.UnsupportedMimeTypeException;
-import org.jsoup.internal.ConstrainableInputStream;
+import org.jsoup.internal.ControllableInputStream;
+import org.jsoup.internal.SharedConstants;
 import org.jsoup.internal.StringUtil;
 import org.jsoup.nodes.Document;
 import org.jsoup.parser.Parser;
 import org.jsoup.parser.TokenQueue;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
 import javax.net.ssl.HttpsURLConnection;
 import javax.net.ssl.SSLSocketFactory;
 import java.io.BufferedInputStream;
@@ -111,7 +112,7 @@ private static String encodeMimeName(String val) {
     }
 
     private HttpConnection.Request req;
-    private @Nullable Connection.Response res;
+    private Connection.@Nullable Response res;
 
     @Override
     public Connection newRequest() {
@@ -377,6 +378,10 @@ public Connection postDataCharset(String charset) {
         return this;
     }
 
+    @Override public Connection auth(RequestAuthenticator authenticator) {
+        req.auth(authenticator);
+        return this;
+    }
 
     @SuppressWarnings("unchecked")
     private static abstract class Base<T extends Connection.Base<T>> implements Connection.Base<T> {
@@ -535,7 +540,7 @@ private List<String> getHeadersCaseInsensitive(String name) {
             return Collections.emptyList();
         }
 
-        private @Nullable Map.Entry<String, List<String>> scanHeaders(String name) {
+        private Map.@Nullable Entry<String, List<String>> scanHeaders(String name) {
             String lc = lowerCase(name);
             for (Map.Entry<String, List<String>> entry : headers.entrySet()) {
                 if (lowerCase(entry.getKey()).equals(lc))
@@ -596,6 +601,7 @@ public static class Request extends HttpConnection.Base<Connection.Request> impl
         private String postDataCharset = DataUtil.defaultCharsetName;
         private @Nullable SSLSocketFactory sslSocketFactory;
         private CookieManager cookieManager;
+        private @Nullable RequestAuthenticator authenticator;
         private volatile boolean executing = false;
 
         Request() {
@@ -626,6 +632,7 @@ public static class Request extends HttpConnection.Base<Connection.Request> impl
             parserDefined = copy.parserDefined;
             sslSocketFactory = copy.sslSocketFactory; // these are all synchronized so safe to share
             cookieManager = copy.cookieManager;
+            authenticator = copy.authenticator;
             executing = false;
         }
 
@@ -764,6 +771,15 @@ public String postDataCharset() {
         CookieManager cookieManager() {
             return cookieManager;
         }
+
+        @Override public Connection.Request auth(@Nullable RequestAuthenticator authenticator) {
+            this.authenticator = authenticator;
+            return this;
+        }
+
+        @Override @Nullable public RequestAuthenticator auth() {
+            return authenticator;
+        }
     }
 
     public static class Response extends HttpConnection.Base<Connection.Response> implements Connection.Response {
@@ -772,7 +788,7 @@ public static class Response extends HttpConnection.Base<Connection.Response> im
         private final int statusCode;
         private final String statusMessage;
         private @Nullable ByteBuffer byteData;
-        private @Nullable InputStream bodyStream;
+        private @Nullable ControllableInputStream bodyStream;
         private @Nullable HttpURLConnection conn;
         private @Nullable String charset;
         private @Nullable final String contentType;
@@ -782,9 +798,9 @@ public static class Response extends HttpConnection.Base<Connection.Response> im
         private final HttpConnection.Request req;
 
         /*
-         * Matches XML content types (like text/xml, application/xhtml+xml;charset=UTF8, etc)
+         * Matches XML content types (like text/xml, image/svg+xml, application/xhtml+xml;charset=UTF8, etc)
          */
-        private static final Pattern xmlContentTypeRxp = Pattern.compile("(application|text)/\\w*\\+?xml.*");
+        private static final Pattern xmlContentTypeRxp = Pattern.compile("(\\w+)/\\w*\\+?xml.*");
 
         /**
          <b>Internal only! </b>Creates a dummy HttpConnection.Response, useful for testing. All actual responses
@@ -869,7 +885,7 @@ else if (methodHasBody)
                         && !contentType.startsWith("text/")
                         && !xmlContentTypeRxp.matcher(contentType).matches()
                         )
-                    throw new UnsupportedMimeTypeException("Unhandled content type. Must be text/*, application/xml, or application/*+xml",
+                    throw new UnsupportedMimeTypeException("Unhandled content type. Must be text/*, */xml, or */*+xml",
                             contentType, req.url().toString());
 
                 // switch to the XML parser if content type is xml and not parser not explicitly set
@@ -879,17 +895,15 @@ else if (methodHasBody)
 
                 res.charset = DataUtil.getCharsetFromContentType(res.contentType); // may be null, readInputStream deals with it
                 if (conn.getContentLength() != 0 && req.method() != HEAD) { // -1 means unknown, chunked. sun throws an IO exception on 500 response with no content when trying to read body
-                    res.bodyStream = conn.getErrorStream() != null ? conn.getErrorStream() : conn.getInputStream();
-                    Validate.notNull(res.bodyStream);
-                    if (res.hasHeaderWithValue(CONTENT_ENCODING, "gzip")) {
-                        res.bodyStream = new GZIPInputStream(res.bodyStream);
-                    } else if (res.hasHeaderWithValue(CONTENT_ENCODING, "deflate")) {
-                        res.bodyStream = new InflaterInputStream(res.bodyStream, new Inflater(true));
-                    }
-                    res.bodyStream = ConstrainableInputStream
-                        .wrap(res.bodyStream, DataUtil.bufferSize, req.maxBodySize())
-                        .timeout(startTime, req.timeout())
-                    ;
+                    InputStream stream = conn.getErrorStream() != null ? conn.getErrorStream() : conn.getInputStream();
+                    if (res.hasHeaderWithValue(CONTENT_ENCODING, "gzip"))
+                        stream = new GZIPInputStream(stream);
+                    else if (res.hasHeaderWithValue(CONTENT_ENCODING, "deflate"))
+                        stream = new InflaterInputStream(stream, new Inflater(true));
+                    
+                    res.bodyStream = ControllableInputStream.wrap(
+                        stream, SharedConstants.DefaultBufferSize, req.maxBodySize())
+                        .timeout(startTime, req.timeout());
                 } else {
                     res.byteData = DataUtil.emptyByteBuffer();
                 }
@@ -898,6 +912,10 @@ else if (methodHasBody)
                 throw e;
             } finally {
                 req.executing = false;
+
+                // detach any thread local auth delegate
+                if (req.authenticator != null)
+                    AuthenticationHandler.handler.remove();
             }
 
             res.executed = true;
@@ -932,12 +950,13 @@ public String contentType() {
 
         public Document parse() throws IOException {
             Validate.isTrue(executed, "Request must be executed (with .execute(), .get(), or .post() before parsing response");
+            InputStream stream = bodyStream;
             if (byteData != null) { // bytes have been read in to the buffer, parse that
-                bodyStream = new ByteArrayInputStream(byteData.array());
+                stream = new ByteArrayInputStream(byteData.array());
                 inputStreamRead = false; // ok to reparse if in bytes
             }
             Validate.isFalse(inputStreamRead, "Input stream already read and parsed, cannot re-read.");
-            Document doc = DataUtil.parseInputStream(bodyStream, charset, url.toExternalForm(), req.parser());
+            Document doc = DataUtil.parseInputStream(stream, charset, url.toExternalForm(), req.parser());
             doc.connection(new HttpConnection(req, this)); // because we're static, don't have the connection obj. // todo - maybe hold in the req?
             charset = doc.outputSettings().charset().name(); // update charset from meta-equiv, possibly
             inputStreamRead = true;
@@ -987,9 +1006,16 @@ public Connection.Response bufferUp() {
         @Override
         public BufferedInputStream bodyStream() {
             Validate.isTrue(executed, "Request must be executed (with .execute(), .get(), or .post() before getting response body");
+
+            // if we have read to bytes (via buffer up), return those as a stream.
+            if (byteData != null) {
+                return new BufferedInputStream(new ByteArrayInputStream(byteData.array()), SharedConstants.DefaultBufferSize);
+            }
+
             Validate.isFalse(inputStreamRead, "Request has already been read");
+            Validate.notNull(bodyStream);
             inputStreamRead = true;
-            return ConstrainableInputStream.wrap(bodyStream, DataUtil.bufferSize, req.maxBodySize());
+            return bodyStream.inputStream();
         }
 
         // set up connection defaults, and details from request
@@ -1008,6 +1034,8 @@ private static HttpURLConnection createConnection(HttpConnection.Request req) th
 
             if (req.sslSocketFactory() != null && conn instanceof HttpsURLConnection)
                 ((HttpsURLConnection) conn).setSSLSocketFactory(req.sslSocketFactory());
+            if (req.authenticator != null)
+                AuthenticationHandler.handler.enable(req.authenticator, conn); // removed in finally
             if (req.method().hasBody())
                 conn.setDoOutput(true);
             CookieUtil.applyCookiesToRequest(req, conn); // from the Request key/val cookies and the Cookie Store
@@ -1040,7 +1068,7 @@ private void safeClose() {
         }
 
         // set up url, method, header, cookies
-        private Response(HttpURLConnection conn, HttpConnection.Request request, @Nullable HttpConnection.Response previousResponse) throws IOException {
+        private Response(HttpURLConnection conn, HttpConnection.Request request, HttpConnection.@Nullable Response previousResponse) throws IOException {
             this.conn = conn;
             this.req = request;
             method = Method.valueOf(conn.getRequestMethod());
diff --git a/src/main/java/org/jsoup/helper/RequestAuthenticator.java b/src/main/java/org/jsoup/helper/RequestAuthenticator.java
new file mode 100644
index 0000000000..7b4adc40ec
--- /dev/null
+++ b/src/main/java/org/jsoup/helper/RequestAuthenticator.java
@@ -0,0 +1,92 @@
+package org.jsoup.helper;
+
+import org.jsoup.Connection;
+import org.jspecify.annotations.Nullable;
+
+import java.net.Authenticator;
+import java.net.PasswordAuthentication;
+import java.net.URL;
+
+/**
+ Supplies credentials for a {@link Connection} when a proxy or a web server asks for authentication. See
+ {@link Connection#auth(RequestAuthenticator)}.
+ */
+@FunctionalInterface
+public interface RequestAuthenticator {
+
+    /**
+     Supply the credentials that answer the authentication request described by the provided Request Context.
+     * @param auth the request context including URL, type (Server or Proxy), and realm.
+     * @return credentials for the request. May return {@code null} if they are not applicable -- but the request will
+     * likely fail, as this method is only called if the request asked for authentication.
+     */
+    @Nullable PasswordAuthentication authenticate(Context auth);
+
+    /**
+     Describes the authentication request (requestor type, URL, realm), to determine the appropriate credentials.
+     */
+    class Context {
+        private final URL url;
+        private final Authenticator.RequestorType type;
+        private final String realm;
+
+        Context(URL url, Authenticator.RequestorType type, String realm) {
+            this.realm = realm;
+            this.type = type;
+            this.url = url;
+        }
+
+        /**
+         Get the URL that is being requested.
+         * @return URL
+         */
+        public URL url() {
+            return url;
+        }
+
+        /**
+         Get the requestor type: {@link Authenticator.RequestorType#PROXY PROXY} if a proxy is requesting
+         authentication, or {@link Authenticator.RequestorType#SERVER SERVER} if the URL's server is requesting.
+         * @return requestor type
+         */
+        public Authenticator.RequestorType type() {
+            return type;
+        }
+
+        /**
+         Get the realm of the authentication request.
+         * @return realm of the authentication request
+         */
+        public String realm() {
+            return realm;
+        }
+
+        /**
+         Test if it is a proxy that is asking for authentication.
+         * @return true if type==proxy.
+         */
+        public boolean isProxy() {
+            return Authenticator.RequestorType.PROXY == type;
+        }
+
+        /**
+         Test if it is the URL's server that is asking for authentication.
+         * @return true if type==server.
+         */
+        public boolean isServer() {
+            return Authenticator.RequestorType.SERVER == type;
+        }
+
+        /**
+         Convenience method to build a PasswordAuthentication object from a username and password.
+         * @param username username credential
+         * @param password password credential
+         * @return a constructed PasswordAuthentication
+         */
+        public PasswordAuthentication credentials(String username, String password) {
+            final char[] secret = password.toCharArray();
+            return new PasswordAuthentication(username, secret);
+        }
+    }
+
+}
diff --git a/src/main/java/org/jsoup/helper/UrlBuilder.java b/src/main/java/org/jsoup/helper/UrlBuilder.java
index 3ef9c56870..30213d3768 100644
--- a/src/main/java/org/jsoup/helper/UrlBuilder.java
+++ b/src/main/java/org/jsoup/helper/UrlBuilder.java
@@ -2,8 +2,8 @@
 
 import org.jsoup.Connection;
 import org.jsoup.internal.StringUtil;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
 import java.io.UnsupportedEncodingException;
 import java.net.IDN;
 import java.net.MalformedURLException;
diff --git a/src/main/java/org/jsoup/helper/Validate.java b/src/main/java/org/jsoup/helper/Validate.java
index 1270b8cc90..c956697380 100644
--- a/src/main/java/org/jsoup/helper/Validate.java
+++ b/src/main/java/org/jsoup/helper/Validate.java
@@ -1,6 +1,6 @@
 package org.jsoup.helper;
 
-import javax.annotation.Nullable;
+import org.jspecify.annotations.Nullable;
 
 /**
  * Validators to check that method arguments meet expectations. 
diff --git a/src/main/java/org/jsoup/helper/W3CDom.java b/src/main/java/org/jsoup/helper/W3CDom.java
index 3070d1024d..6ce0abd9e5 100644
--- a/src/main/java/org/jsoup/helper/W3CDom.java
+++ b/src/main/java/org/jsoup/helper/W3CDom.java
@@ -17,8 +17,8 @@
 import org.w3c.dom.Node;
 import org.w3c.dom.NodeList;
 import org.w3c.dom.Text;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
 import javax.xml.parsers.DocumentBuilder;
 import javax.xml.parsers.DocumentBuilderFactory;
 import javax.xml.parsers.ParserConfigurationException;
@@ -207,8 +207,12 @@ public Document fromJsoup(org.jsoup.nodes.Element in) {
             org.jsoup.nodes.Document inDoc = in.ownerDocument();
             org.jsoup.nodes.DocumentType doctype = inDoc != null ? inDoc.documentType() : null;
             if (doctype != null) {
-                org.w3c.dom.DocumentType documentType = impl.createDocumentType(doctype.name(), doctype.publicId(), doctype.systemId());
-                out.appendChild(documentType);
+                try {
+                    org.w3c.dom.DocumentType documentType = impl.createDocumentType(doctype.name(), doctype.publicId(), doctype.systemId());
+                    out.appendChild(documentType);
+                } catch (DOMException ignored) {
+                    // invalid / empty doctype dropped
+                }
             }
             out.setXmlStandalone(true);
             // if in is Document, use the root element, not the wrapping document, as the context:
@@ -349,7 +353,7 @@ protected static class W3CBuilder implements NodeVisitor {
         private final Stack<HashMap<String, String>> namespacesStack = new Stack<>(); // stack of namespaces, prefix => urn
         private Node dest;
         private Syntax syntax = Syntax.xml; // the syntax (to coerce attributes to). From the input doc if available.
-        @Nullable private final org.jsoup.nodes.Element contextElement;
+        /*@Nullable*/ private final org.jsoup.nodes.Element contextElement; // todo - unsure why this can't be marked nullable?
 
         public W3CBuilder(Document doc) {
             this.doc = doc;
diff --git a/src/main/java/org/jsoup/helper/package-info.java b/src/main/java/org/jsoup/helper/package-info.java
index 2074b7aafa..8a8f998f97 100644
--- a/src/main/java/org/jsoup/helper/package-info.java
+++ b/src/main/java/org/jsoup/helper/package-info.java
@@ -1,7 +1,7 @@
 /**
  Package containing classes supporting the core jsoup code.
  */
-@NonnullByDefault
+@NullMarked
 package org.jsoup.helper;
 
-import org.jsoup.internal.NonnullByDefault;
+import org.jspecify.annotations.NullMarked;
diff --git a/src/main/java/org/jsoup/internal/ConstrainableInputStream.java b/src/main/java/org/jsoup/internal/ConstrainableInputStream.java
index aa2c275127..8f382ea042 100644
--- a/src/main/java/org/jsoup/internal/ConstrainableInputStream.java
+++ b/src/main/java/org/jsoup/internal/ConstrainableInputStream.java
@@ -1,9 +1,9 @@
 package org.jsoup.internal;
 
+import org.jsoup.helper.DataUtil;
 import org.jsoup.helper.Validate;
 
 import java.io.BufferedInputStream;
-import java.io.ByteArrayOutputStream;
 import java.io.IOException;
 import java.io.InputStream;
 import java.net.SocketTimeoutException;
@@ -12,10 +12,10 @@
 /**
  * A jsoup internal class (so don't use it as there is no contract API) that enables constraints on an Input Stream,
  * namely a maximum read size, and the ability to Thread.interrupt() the read.
+ * @deprecated use {@link ControllableInputStream} instead (but don't use that either, because this is jsoup internal!)
  */
+@Deprecated
 public final class ConstrainableInputStream extends BufferedInputStream {
-    private static final int DefaultSize = 1024 * 32;
-
     private final boolean capped;
     private final int maxSize;
     private long startTime;
@@ -74,27 +74,7 @@ public int read(byte[] b, int off, int len) throws IOException {
      * reading just the first bytes.
      */
     public ByteBuffer readToByteBuffer(int max) throws IOException {
-        Validate.isTrue(max >= 0, "maxSize must be 0 (unlimited) or larger");
-        final boolean localCapped = max > 0; // still possibly capped in total stream
-        final int bufferSize = localCapped && max < DefaultSize ? max : DefaultSize;
-        final byte[] readBuffer = new byte[bufferSize];
-        final ByteArrayOutputStream outStream = new ByteArrayOutputStream(bufferSize);
-
-        int read;
-        int remaining = max;
-        while (true) {
-            read = read(readBuffer, 0, localCapped ? Math.min(remaining, bufferSize) : bufferSize);
-            if (read == -1) break;
-            if (localCapped) { // this local byteBuffer cap may be smaller than the overall maxSize (like when reading first bytes)
-                if (read >= remaining) {
-                    outStream.write(readBuffer, 0, remaining);
-                    break;
-                }
-                remaining -= read;
-            }
-            outStream.write(readBuffer, 0, read);
-        }
-        return ByteBuffer.wrap(outStream.toByteArray());
+        return DataUtil.readToByteBuffer(this, max);
     }
 
     @Override
diff --git a/src/main/java/org/jsoup/internal/ControllableInputStream.java b/src/main/java/org/jsoup/internal/ControllableInputStream.java
new file mode 100644
index 0000000000..7f73e5807a
--- /dev/null
+++ b/src/main/java/org/jsoup/internal/ControllableInputStream.java
@@ -0,0 +1,141 @@
+package org.jsoup.internal;
+
+import org.jsoup.helper.DataUtil;
+import org.jsoup.helper.Validate;
+
+import java.io.BufferedInputStream;
+import java.io.ByteArrayOutputStream;
+import java.io.FilterInputStream;
+import java.io.IOException;
+import java.io.InputStream;
+import java.net.SocketTimeoutException;
+import java.nio.ByteBuffer;
+
+import static org.jsoup.internal.SharedConstants.DefaultBufferSize;
+
+/**
+ * A jsoup internal class (so don't use it as there is no contract API) that enables controls on a Buffered Input Stream,
+ * namely a maximum read size, and the ability to Thread.interrupt() the read.
+ */
+// reimplemented from ConstrainableInputStream for JDK21 - extending BufferedInputStream will pin threads during read
+public class ControllableInputStream extends FilterInputStream {
+    private final BufferedInputStream buff;
+    private final boolean capped;
+    private final int maxSize;
+    private long startTime;
+    private long timeout = 0; // optional max time of request
+    private int remaining;
+    private int markPos;
+    private boolean interrupted;
+
+    private ControllableInputStream(BufferedInputStream in, int maxSize) {
+        super(in);
+        Validate.isTrue(maxSize >= 0);
+        this.maxSize = maxSize;
+        this.capped = (maxSize != 0); // a max of 0 means unlimited
+        this.remaining = maxSize; // the full budget is available until bytes are read
+        this.markPos = -1; // nothing marked yet
+        this.buff = in;
+        this.startTime = System.nanoTime();
+    }
+
+    /**
+     * Get a ControllableInputStream for the supplied stream. A stream that already is one is returned as-is (keeping
+     * its own limits); an existing BufferedInputStream is wrapped directly, without using {@code bufferSize}.
+     * @param in the input stream to (maybe) wrap
+     * @param bufferSize the buffer size to use when reading, if a new buffer needs to be created
+     * @param maxSize the maximum size to allow to be read. 0 == infinite.
+     * @return a controllable input stream
+     */
+    public static ControllableInputStream wrap(InputStream in, int bufferSize, int maxSize) {
+        if (in instanceof ControllableInputStream) return (ControllableInputStream) in;
+        final BufferedInputStream buffered = in instanceof BufferedInputStream
+            ? (BufferedInputStream) in
+            : new BufferedInputStream(in, bufferSize);
+        return new ControllableInputStream(buffered, maxSize);
+    }
+
+    // Reads up to len bytes, honouring the cap, timeout, and interrupt. Returns -1 at end of stream, when capped out,
+    // or once interrupted; returns 0 if the socket timed out before the overall deadline, so the caller can retry.
+    @Override public int read(byte[] b, int off, int len) throws IOException {
+        if (interrupted || capped && remaining <= 0)
+            return -1;
+        if (Thread.currentThread().isInterrupted()) {
+            interrupted = true; // interrupted latches, because parse() may call twice
+            return -1;
+        }
+        if (expired())
+            throw new SocketTimeoutException("Read timeout");
+        if (capped && len > remaining)
+            len = remaining; // don't read more than desired, even if available
+
+        try {
+            final int read = super.read(b, off, len);
+            if (read > 0) remaining -= read; // EOF is -1, which must not grow the remaining budget
+            return read;
+        } catch (SocketTimeoutException e) {
+            if (timeout == 0 || expired()) throw e; // no later deadline check would stop the retries: surface it
+            return 0;
+        }
+    }
+
+    /**
+     * Reads the supplied input stream to a ByteBuffer. The supplied max may be less than the stream's own max, to
+     * support reading just the first bytes.
+     * @param in the stream to read from
+     * @param max the maximum number of bytes to read; 0 reads until the stream reports its end
+     * @return a ByteBuffer wrapping the bytes that were read
+     */
+    public static ByteBuffer readToByteBuffer(InputStream in, int max) throws IOException {
+        Validate.isTrue(max >= 0, "maxSize must be 0 (unlimited) or larger");
+        Validate.notNull(in);
+        final boolean limited = max > 0; // the stream itself may still be capped in total
+        final int chunkSize = (limited && max < DefaultBufferSize) ? max : DefaultBufferSize;
+        final byte[] chunk = new byte[chunkSize];
+        final ByteArrayOutputStream collected = new ByteArrayOutputStream(chunkSize);
+
+        int budget = max;
+        for (;;) {
+            final int got = in.read(chunk, 0, limited ? Math.min(budget, chunkSize) : chunkSize);
+            if (got == -1) break;
+            if (limited && got >= budget) { // reached the local cap, which may be smaller than the stream's own
+                collected.write(chunk, 0, budget);
+                break;
+            }
+            if (limited) budget -= got;
+            collected.write(chunk, 0, got);
+        }
+        return ByteBuffer.wrap(collected.toByteArray());
+    }
+
+    @SuppressWarnings("NonSynchronizedMethodOverridesSynchronizedMethod") // not synchronized in later JDKs
+    @Override public void reset() throws IOException {
+        super.reset(); // may throw, in which case the budget below is left unchanged
+        remaining = maxSize - markPos; // restore the budget to what it was when mark() recorded markPos
+    }
+
+    @SuppressWarnings("NonSynchronizedMethodOverridesSynchronizedMethod") // not synchronized in later JDKs
+    @Override public void mark(int readlimit) {
+        super.mark(readlimit);
+        markPos = maxSize - remaining; // how much of the budget has been used so far; reset() rewinds to this
+    }
+
+    public ControllableInputStream timeout(long startTimeNanos, long timeoutMillis) {
+        timeout = timeoutMillis * 1000000; // millis -> nanos, to compare against System.nanoTime() deltas in expired()
+        startTime = startTimeNanos; // the deadline is measured from here, not from when this stream was created
+        return this;
+    }
+
+    /**
+     * Tests if the overall read deadline has passed.
+     * @return true if a timeout is set (non-zero) and more nanoseconds than that have elapsed since startTime
+     */
+    private boolean expired() {
+        // short-circuits, so the clock is only consulted when a timeout is actually set
+        return timeout != 0 && (System.nanoTime() - startTime) > timeout;
+    }
+
+    public BufferedInputStream inputStream() { // exposes the wrapped buffered stream itself
+        return buff; // NOTE(review): reads made via this stream do not pass through read() above (cap/timeout/interrupt)
+    }
+}
diff --git a/src/main/java/org/jsoup/internal/FieldsAreNonnullByDefault.java b/src/main/java/org/jsoup/internal/FieldsAreNonnullByDefault.java
index 56d4b86927..9e099b4ee5 100644
--- a/src/main/java/org/jsoup/internal/FieldsAreNonnullByDefault.java
+++ b/src/main/java/org/jsoup/internal/FieldsAreNonnullByDefault.java
@@ -1,19 +1,17 @@
 package org.jsoup.internal;
 
-import javax.annotation.Nonnull;
-import javax.annotation.meta.TypeQualifierDefault;
+import org.jspecify.annotations.NullMarked;
+
 import java.lang.annotation.Documented;
-import java.lang.annotation.ElementType;
 import java.lang.annotation.Retention;
 import java.lang.annotation.RetentionPolicy;
 
 /**
- Indicates that fields types are not nullable, unless otherwise specified by @Nullable.
- @see javax.annotation.ParametersAreNonnullByDefault
+ @deprecated Previously indicated that fields types are not nullable, unless otherwise specified by @Nullable.
  */
+@Deprecated
 @Documented
-@Nonnull
-@TypeQualifierDefault(ElementType.FIELD)
+@NullMarked
 @Retention(value = RetentionPolicy.CLASS)
 public @interface FieldsAreNonnullByDefault {
 }
diff --git a/src/main/java/org/jsoup/internal/NonnullByDefault.java b/src/main/java/org/jsoup/internal/NonnullByDefault.java
index 869f9fea8c..cda055d4f2 100644
--- a/src/main/java/org/jsoup/internal/NonnullByDefault.java
+++ b/src/main/java/org/jsoup/internal/NonnullByDefault.java
@@ -1,19 +1,17 @@
 package org.jsoup.internal;
 
-import javax.annotation.Nonnull;
-import javax.annotation.meta.TypeQualifierDefault;
+import org.jspecify.annotations.NullMarked;
+
 import java.lang.annotation.Documented;
-import java.lang.annotation.ElementType;
 import java.lang.annotation.Retention;
 import java.lang.annotation.RetentionPolicy;
 
 /**
- Indicates that all components (methods, returns, fields) are not nullable, unless otherwise specified by @Nullable.
- @see javax.annotation.ParametersAreNonnullByDefault
+ @deprecated Previously indicated that all components (methods, returns, fields) are not nullable, unless otherwise specified by @Nullable.
  */
+@Deprecated
 @Documented
-@Nonnull
-@TypeQualifierDefault({ElementType.METHOD, ElementType.PARAMETER, ElementType.FIELD})
+@NullMarked
 @Retention(value = RetentionPolicy.CLASS)
 public @interface NonnullByDefault {
 }
diff --git a/src/main/java/org/jsoup/internal/ReturnsAreNonnullByDefault.java b/src/main/java/org/jsoup/internal/ReturnsAreNonnullByDefault.java
index 3846135116..d218d6cb7a 100644
--- a/src/main/java/org/jsoup/internal/ReturnsAreNonnullByDefault.java
+++ b/src/main/java/org/jsoup/internal/ReturnsAreNonnullByDefault.java
@@ -1,19 +1,17 @@
 package org.jsoup.internal;
 
-import javax.annotation.Nonnull;
-import javax.annotation.meta.TypeQualifierDefault;
+import org.jspecify.annotations.NullMarked;
+
 import java.lang.annotation.Documented;
-import java.lang.annotation.ElementType;
 import java.lang.annotation.Retention;
 import java.lang.annotation.RetentionPolicy;
 
 /**
- Indicates return types are not nullable, unless otherwise specified by @Nullable.
- @see javax.annotation.ParametersAreNonnullByDefault
+ @deprecated Previously indicated that return types are not nullable, unless otherwise specified by @Nullable.
  */
+@Deprecated
 @Documented
-@Nonnull
-@TypeQualifierDefault(ElementType.METHOD)
+@NullMarked
 @Retention(value = RetentionPolicy.RUNTIME)
 public @interface ReturnsAreNonnullByDefault {
 }
diff --git a/src/main/java/org/jsoup/internal/SharedConstants.java b/src/main/java/org/jsoup/internal/SharedConstants.java
new file mode 100644
index 0000000000..141e1df9a8
--- /dev/null
+++ b/src/main/java/org/jsoup/internal/SharedConstants.java
@@ -0,0 +1,16 @@
+package org.jsoup.internal;
+
+/**
+ Constants that are shared across jsoup packages. Do not use as they may change without warning. Users will not be
+ able to see this package when modules are enabled.
+ */
+public final class SharedConstants {
+    public static final String UserDataKey = "/jsoup.userdata"; // Attributes slot that holds the user-data map
+    public static final String AttrRangeKey = "jsoup.attrs"; // user-data key for the map of attribute source ranges
+    public static final String RangeKey = "jsoup.start"; // presumably the user-data key for a node's start range
+    public static final String EndRangeKey = "jsoup.end"; // presumably the user-data key for an element's end range
+
+    public static final int DefaultBufferSize = 32 * 1024; // 32 KiB
+
+    private SharedConstants() {} // constants holder; not instantiable
+}
diff --git a/src/main/java/org/jsoup/internal/StringUtil.java b/src/main/java/org/jsoup/internal/StringUtil.java
index 059c0ba9bc..85e104ef16 100644
--- a/src/main/java/org/jsoup/internal/StringUtil.java
+++ b/src/main/java/org/jsoup/internal/StringUtil.java
@@ -1,8 +1,8 @@
 package org.jsoup.internal;
 
 import org.jsoup.helper.Validate;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
 import java.net.MalformedURLException;
 import java.net.URL;
 import java.util.Arrays;
diff --git a/src/main/java/org/jsoup/internal/package-info.java b/src/main/java/org/jsoup/internal/package-info.java
index 8fdca179b2..739c6b8fed 100644
--- a/src/main/java/org/jsoup/internal/package-info.java
+++ b/src/main/java/org/jsoup/internal/package-info.java
@@ -2,4 +2,7 @@
  * Util methods used by Jsoup. Please don't depend on the APIs implemented here as the contents may change without
  * notice.
  */
+@NullMarked
 package org.jsoup.internal;
+
+import org.jspecify.annotations.NullMarked;
diff --git a/src/main/java/org/jsoup/nodes/Attribute.java b/src/main/java/org/jsoup/nodes/Attribute.java
index 56a34b49bf..f77106db1d 100644
--- a/src/main/java/org/jsoup/nodes/Attribute.java
+++ b/src/main/java/org/jsoup/nodes/Attribute.java
@@ -3,10 +3,11 @@
 import org.jsoup.SerializationException;
 import org.jsoup.helper.Validate;
 import org.jsoup.internal.Normalizer;
+import org.jsoup.internal.SharedConstants;
 import org.jsoup.internal.StringUtil;
 import org.jsoup.nodes.Document.OutputSettings.Syntax;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
 import java.io.IOException;
 import java.util.Arrays;
 import java.util.Map;
@@ -99,7 +100,7 @@ public boolean hasDeclaredValue() {
      @param val the new attribute value; may be null (to set an enabled boolean attribute)
      @return the previous value (if was null; an empty string)
      */
-    public String setValue(@Nullable String val) {
+    @Override public String setValue(@Nullable String val) {
         String oldVal = this.val;
         if (parent != null) {
             int i = parent.indexOfKey(this.key);
@@ -127,6 +128,23 @@ public String html() {
         return StringUtil.releaseBuilder(sb);
     }
 
+    /**
+     Get the source ranges (start to end positions) in the original input source from which this attribute's <b>name</b>
+     and <b>value</b> were parsed.
+     <p>Position tracking must be enabled prior to parsing the content.</p>
+     @return the ranges for the attribute's name and value, or {@code untracked} if this attribute has no parent
+     Attributes, or if its range was not tracked.
+     @see org.jsoup.parser.Parser#setTrackPosition(boolean)
+     @see Attributes#sourceRange(String)
+     @see Node#sourceRange()
+     @see Element#endSourceRange()
+     @since 1.17.1
+     */
+    public Range.AttributeRange sourceRange() {
+        final Attributes owner = parent; // ranges are looked up on the owning Attributes, if there is one
+        return owner != null ? owner.sourceRange(key) : Range.AttributeRange.UntrackedAttr;
+    }
+
     protected void html(Appendable accum, Document.OutputSettings out) throws IOException {
         html(key, val, accum, out);
     }
diff --git a/src/main/java/org/jsoup/nodes/Attributes.java b/src/main/java/org/jsoup/nodes/Attributes.java
index f24695265a..ecbe9f4ead 100644
--- a/src/main/java/org/jsoup/nodes/Attributes.java
+++ b/src/main/java/org/jsoup/nodes/Attributes.java
@@ -2,10 +2,11 @@
 
 import org.jsoup.SerializationException;
 import org.jsoup.helper.Validate;
+import org.jsoup.internal.SharedConstants;
 import org.jsoup.internal.StringUtil;
 import org.jsoup.parser.ParseSettings;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
 import java.io.IOException;
 import java.util.AbstractMap;
 import java.util.AbstractSet;
@@ -13,17 +14,23 @@
 import java.util.Arrays;
 import java.util.Collections;
 import java.util.ConcurrentModificationException;
+import java.util.HashMap;
 import java.util.Iterator;
 import java.util.List;
 import java.util.Map;
+import java.util.NoSuchElementException;
 import java.util.Set;
 
 import static org.jsoup.internal.Normalizer.lowerCase;
+import static org.jsoup.internal.SharedConstants.AttrRangeKey;
+import static org.jsoup.nodes.Range.AttributeRange.UntrackedAttr;
 
 /**
  * The attributes of an Element.
  * <p>
- * Attributes are treated as a map: there can be only one value associated with an attribute key/name.
+ * During parsing, attributes with the same name in an element are deduplicated, according to the configured parser's
+ * attribute case-sensitive setting. It is possible to have duplicate attributes subsequently if
+ * {@link #add(String, String)} is used rather than {@link #put(String, String)}.
  * </p>
  * <p>
  * Attribute name and value comparisons are generally <b>case sensitive</b>. By default for HTML, attribute names are
@@ -34,12 +41,13 @@
  * @author Jonathan Hedley, jonathan@hedley.net
  */
 public class Attributes implements Iterable<Attribute>, Cloneable {
+    // Indicates an internal key. Can't be set via HTML. (It could be set via accessor, but not too worried about
+    // that. Suppressed from list, iter.)
+    static final char InternalPrefix = '/';
+
     // The Attributes object is only created on the first use of an attribute; the Element will just have a null
     // Attribute slot otherwise
     protected static final String dataPrefix = "data-";
-    // Indicates a jsoup internal key. Can't be set via HTML. (It could be set via accessor, but not too worried about
-    // that. Suppressed from list, iter.
-    static final char InternalPrefix = '/';
     private static final int InitialCapacity = 3; // sampling found mean count when attrs present = 1.49; 1.08 overall. 2.6:1 don't have any attrs.
 
     // manages the key/val arrays
@@ -51,6 +59,7 @@ public class Attributes implements Iterable<Attribute>, Cloneable {
     private int size = 0; // number of slots used (not total capacity, which is keys.length)
     String[] keys = new String[InitialCapacity];
     Object[] vals = new Object[InitialCapacity]; // Genericish: all non-internal attribute values must be Strings and are cast on access.
+    // todo - make keys iterable without creating Attribute objects
 
     // check there's room for more
     private void checkCapacity(int minNewSize) {
@@ -111,19 +120,6 @@ public String getIgnoreCase(String key) {
         return i == NotFound ? EmptyString : checkNotNull(vals[i]);
     }
 
-    /**
-     Get an arbitrary user data object by key.
-     * @param key case sensitive key to the object.
-     * @return the object associated to this key, or {@code null} if not found.
-     */
-    @Nullable
-    Object getUserData(String key) {
-        Validate.notNull(key);
-        if (!isInternalKey(key)) key = internalKey(key);
-        int i = indexOfKeyIgnoreCase(key);
-        return i == NotFound ? null : vals[i];
-    }
-
     /**
      * Adds a new attribute. Will produce duplicates if the key already exists.
      * @see Attributes#put(String, String)
@@ -143,7 +139,7 @@ private void addObject(String key, @Nullable Object value) {
     /**
      * Set a new attribute, or replace an existing one by key.
      * @param key case sensitive attribute key (not null)
-     * @param value attribute value (may be null, to set a boolean attribute)
+     * @param value attribute value (which can be null, to set a true boolean attribute)
      * @return these attributes, for chaining
      */
     public Attributes put(String key, @Nullable String value) {
@@ -157,21 +153,50 @@ public Attributes put(String key, @Nullable String value) {
     }
 
     /**
-     Put an arbitrary user-data object by key. Will be treated as an internal attribute, so will not be emitted in HTML.
-     * @param key case sensitive key
+     Get the map holding any user-data associated with these Attributes. Will be created empty on first use. Held as
+     an internal attribute, not a field member, to reduce the memory footprint of Attributes when not used. Can hold
+     arbitrary objects; use for source ranges, connecting W3C nodes to Elements, etc.
+     * @return the map holding user-data
+     */
+    Map<String, Object> userData() {
+        final int slot = indexOfKey(SharedConstants.UserDataKey);
+        if (slot != NotFound) {
+            //noinspection unchecked
+            return (Map<String, Object>) vals[slot];
+        }
+
+        // first use: create the backing map and store it under the internal user-data key
+        final Map<String, Object> created = new HashMap<>();
+        addObject(SharedConstants.UserDataKey, created);
+        return created;
+    }
+
+    /**
+     Look up an arbitrary user-data object by key. Does not create the user-data map if none exists yet.
+     * @param key case-sensitive key to the object.
+     * @return the object associated to this key, or {@code null} if not found.
+     * @see #userData(String key, Object val)
+     * @since 1.17.1
+     */
+    @Nullable
+    public Object userData(String key) {
+        Validate.notNull(key);
+        // check first, as userData() would otherwise create (and store) an empty map just to answer a lookup
+        final boolean hasUserData = hasKey(SharedConstants.UserDataKey);
+        return hasUserData ? userData().get(key) : null;
+    }
+
+    /**
+     Set an arbitrary user-data object by key. Will be treated as an internal attribute, so will not be emitted in HTML.
+     * @param key case-sensitive key
      * @param value object value
      * @return these attributes
-     * @see #getUserData(String)
+     * @see #userData(String key)
+     * @since 1.17.1
      */
-    Attributes putUserData(String key, Object value) {
+    public Attributes userData(String key, Object value) {
         Validate.notNull(key);
-        if (!isInternalKey(key)) key = internalKey(key);
-        Validate.notNull(value);
-        int i = indexOfKey(key);
-        if (i != NotFound)
-            vals[i] = value;
-        else
-            addObject(key, value);
+        userData().put(key, value);
         return this;
     }
 
@@ -187,7 +212,7 @@ void putIgnoreCase(String key, @Nullable String value) {
     }
 
     /**
-     * Set a new boolean attribute, remove attribute if value is false.
+     * Set a new boolean attribute. Removes the attribute if the value is false.
      * @param key case <b>insensitive</b> attribute key
      * @param value attribute value
      * @return these attributes, for chaining
@@ -202,7 +227,7 @@ public Attributes put(String key, boolean value) {
 
     /**
      Set a new attribute, or replace an existing one by key.
-     @param attribute attribute with case sensitive key
+     @param attribute attribute with case-sensitive key
      @return these attributes, for chaining
      */
     public Attributes put(Attribute attribute) {
@@ -291,6 +316,7 @@ public boolean hasDeclaredValueForKeyIgnoreCase(String key) {
      */
     public int size() {
         return size;
+        // todo - exclude internal attributes from this count - maintain size, count of internals
     }
 
     /**
@@ -319,6 +345,29 @@ public void addAll(Attributes incoming) {
         }
     }
 
+    /**
+     Get the source ranges (start to end position) in the original input source from which the <b>name</b> and
+     <b>value</b> of the attribute with the given key were parsed.
+     <p>Position tracking must be enabled prior to parsing the content.</p>
+     @param key the attribute name
+     @return the ranges for the attribute's name and value, or {@code untracked} if the attribute does not exist or its range
+     was not tracked.
+     @see org.jsoup.parser.Parser#setTrackPosition(boolean)
+     @see Attribute#sourceRange()
+     @see Node#sourceRange()
+     @see Element#endSourceRange()
+     @since 1.17.1
+     */
+    public Range.AttributeRange sourceRange(String key) {
+        if (!hasKey(key)) return UntrackedAttr; // no such attribute
+        //noinspection unchecked
+        final Map<String, Range.AttributeRange> tracked = (Map<String, Range.AttributeRange>) userData(AttrRangeKey);
+        if (tracked == null) return UntrackedAttr; // no ranges were recorded for these attributes
+        final Range.AttributeRange found = tracked.get(key);
+        return found == null ? UntrackedAttr : found;
+    }
+
+    @Override
     public Iterator<Attribute> iterator() {
         return new Iterator<Attribute>() {
             int expectedSize = size;
@@ -340,6 +389,7 @@ public boolean hasNext() {
             @Override
             public Attribute next() {
                 checkModified();
+                if (i >= size) throw new NoSuchElementException();
                 final Attribute attr = new Attribute(keys[i], (String) vals[i], Attributes.this);
                 i++;
                 return attr;
@@ -467,11 +517,12 @@ public Attributes clone() {
     }
 
     /**
-     * Internal method. Lowercases all keys.
+     * Internal method. Lowercases all (non-internal) keys.
      */
     public void normalize() {
         for (int i = 0; i < size; i++) {
-            keys[i] = lowerCase(keys[i]);
+            if (!isInternalKey(keys[i]))
+                keys[i] = lowerCase(keys[i]);
         }
     }
 
@@ -565,7 +616,7 @@ static String internalKey(String key) {
         return InternalPrefix + key;
     }
 
-    private boolean isInternalKey(String key) {
+    static boolean isInternalKey(String key) {
         return key != null && key.length() > 1 && key.charAt(0) == InternalPrefix;
     }
 }
diff --git a/src/main/java/org/jsoup/nodes/Comment.java b/src/main/java/org/jsoup/nodes/Comment.java
index 77585bc1da..a3ed2852e1 100644
--- a/src/main/java/org/jsoup/nodes/Comment.java
+++ b/src/main/java/org/jsoup/nodes/Comment.java
@@ -2,8 +2,8 @@
 
 import org.jsoup.parser.ParseSettings;
 import org.jsoup.parser.Parser;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
 import java.io.IOException;
 
 /**
diff --git a/src/main/java/org/jsoup/nodes/DataNode.java b/src/main/java/org/jsoup/nodes/DataNode.java
index 65ae7a338b..4a0cf434f2 100644
--- a/src/main/java/org/jsoup/nodes/DataNode.java
+++ b/src/main/java/org/jsoup/nodes/DataNode.java
@@ -1,6 +1,7 @@
 package org.jsoup.nodes;
 
 import java.io.IOException;
+import org.jsoup.nodes.Entities.EscapeMode;
 
 /**
  A data node, for contents of style, script tags etc, where contents should not show in text().
@@ -40,7 +41,16 @@ public DataNode setWholeData(String data) {
 
     @Override
     void outerHtmlHead(Appendable accum, int depth, Document.OutputSettings out) throws IOException {
-        accum.append(getWholeData()); // data is not escaped in return from data nodes, so " in script, style is plain
+        if (out.syntax() == Document.OutputSettings.Syntax.xml) {
+            // In XML mode, output data nodes as CDATA, so can parse as XML
+            accum
+                .append("<![CDATA[")
+                .append(getWholeData())
+                .append("]]>");
+        } else {
+            // In HTML, data is not escaped in return from data nodes, so " in script, style is plain
+            accum.append(getWholeData());
+        }
     }
 
     @Override
diff --git a/src/main/java/org/jsoup/nodes/Document.java b/src/main/java/org/jsoup/nodes/Document.java
index b2c3f7c88a..fc095170e7 100644
--- a/src/main/java/org/jsoup/nodes/Document.java
+++ b/src/main/java/org/jsoup/nodes/Document.java
@@ -11,8 +11,8 @@
 import org.jsoup.select.Elements;
 import org.jsoup.select.Evaluator;
 import org.jsoup.select.Selector;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
 import java.nio.charset.Charset;
 import java.nio.charset.CharsetEncoder;
 import java.util.List;
@@ -488,11 +488,15 @@ public Syntax syntax() {
         /**
          * Set the document's output syntax. Either {@code html}, with empty tags and boolean attributes (etc), or
          * {@code xml}, with self-closing tags.
+         * <p>When set to {@link Document.OutputSettings.Syntax#xml xml}, the {@link #escapeMode() escapeMode} is
+         * automatically set to {@link Entities.EscapeMode#xhtml}, but may be subsequently changed if desired.</p>
          * @param syntax serialization syntax
          * @return the document's output settings, for chaining
          */
         public OutputSettings syntax(Syntax syntax) {
             this.syntax = syntax;
+            if (syntax == Syntax.xml)
+                this.escapeMode(Entities.EscapeMode.xhtml);
             return this;
         }
 
diff --git a/src/main/java/org/jsoup/nodes/Element.java b/src/main/java/org/jsoup/nodes/Element.java
index 956d583377..cfb19113b1 100644
--- a/src/main/java/org/jsoup/nodes/Element.java
+++ b/src/main/java/org/jsoup/nodes/Element.java
@@ -2,7 +2,6 @@
 
 import org.jsoup.helper.ChangeNotifyingArrayList;
 import org.jsoup.helper.Validate;
-import org.jsoup.internal.NonnullByDefault;
 import org.jsoup.internal.StringUtil;
 import org.jsoup.parser.ParseSettings;
 import org.jsoup.parser.Parser;
@@ -15,8 +14,8 @@
 import org.jsoup.select.NodeVisitor;
 import org.jsoup.select.QueryParser;
 import org.jsoup.select.Selector;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
 import java.io.IOException;
 import java.lang.ref.WeakReference;
 import java.util.ArrayList;
@@ -31,6 +30,7 @@
 import java.util.function.Consumer;
 import java.util.regex.Pattern;
 import java.util.regex.PatternSyntaxException;
+import java.util.stream.Stream;
 
 import static org.jsoup.internal.Normalizer.normalize;
 import static org.jsoup.nodes.TextNode.lastCharIsWhitespace;
@@ -41,7 +41,6 @@ An HTML Element consists of a tag name, attributes, and child nodes (including t
  <p>
  From an Element, you can extract data, traverse the node graph, and manipulate the HTML.
 */
-@NonnullByDefault
 public class Element extends Node {
     private static final List<Element> EmptyChildren = Collections.emptyList();
     private static final Pattern ClassSplit = Pattern.compile("\\s+");
@@ -378,6 +377,16 @@ void nodelistChanged() {
         shadowChildrenRef = null;
     }
 
+    /**
+     Returns a Stream of this Element and all of its descendant Elements. The stream has document order.
+     @return a stream of this element and its descendants.
+     @see #nodeStream()
+     @since 1.17.1
+     */
+    public Stream<Element> stream() {
+        return NodeUtils.stream(this, Element.class);
+    }
+
     /**
      * Get this element's child text nodes. The list is unmodifiable but the text nodes may be manipulated.
      * <p>
@@ -454,7 +463,6 @@ public Elements select(Evaluator evaluator) {
         return Selector.select(evaluator, this);
     }
 
-
     /**
      * Find the first Element that matches the {@link Selector} CSS query, with this element as the starting context.
      * <p>This is effectively the same as calling {@code element.select(query).first()}, but is more efficient as query
@@ -697,7 +705,7 @@ public Element insertChildren(int index, Node... children) {
     }
 
     /**
-     * Create a new element by tag name, and add it as the last child.
+     * Create a new element by tag name, and add it as this Element's last child.
      *
      * @param tagName the name of the tag (e.g. {@code div}).
      * @return the new element, to allow you to add content to it, e.g.:
@@ -707,6 +715,13 @@ public Element appendElement(String tagName) {
         return appendElement(tagName, tag.namespace());
     }
 
+    /**
+     * Create a new element by tag name and namespace, and add it as this Element's last child.
+     *
+     * @param tagName the name of the tag (e.g. {@code div}).
+     * @param namespace the namespace of the tag (e.g. {@link Parser#NamespaceHtml})
+     * @return the new element, in the specified namespace
+     */
     public Element appendElement(String tagName, String namespace) {
         Element child = new Element(Tag.valueOf(tagName, namespace, NodeUtils.parser(this).settings()), baseUri());
         appendChild(child);
@@ -714,7 +729,7 @@ public Element appendElement(String tagName, String namespace) {
     }
 
     /**
-     * Create a new element by tag name, and add it as the first child.
+     * Create a new element by tag name, and add it as this Element's first child.
      *
      * @param tagName the name of the tag (e.g. {@code div}).
      * @return the new element, to allow you to add content to it, e.g.:
@@ -724,6 +739,13 @@ public Element prependElement(String tagName) {
         return prependElement(tagName, tag.namespace());
     }
 
+    /**
+     * Create a new element by tag name and namespace, and add it as this Element's first child.
+     *
+     * @param tagName the name of the tag (e.g. {@code div}).
+     * @param namespace the namespace of the tag (e.g. {@link Parser#NamespaceHtml})
+     * @return the new element, in the specified namespace
+     */
     public Element prependElement(String tagName, String namespace) {
         Element child = new Element(Tag.valueOf(tagName, namespace, NodeUtils.parser(this).settings()), baseUri());
         prependChild(child);
@@ -1389,7 +1411,7 @@ public void tail(Node node, int depth) {
      */
     public String wholeText() {
         final StringBuilder accum = StringUtil.borrowBuilder();
-        NodeTraversor.traverse((node, depth) -> appendWholeText(node, accum), this);
+        nodeStream().forEach(node -> appendWholeText(node, accum));
         return StringUtil.releaseBuilder(accum);
     }
 
@@ -1402,7 +1424,7 @@ private static void appendWholeText(Node node, StringBuilder accum) {
     }
 
     /**
-     Get the non-normalized, decoded text of this element, <b>not including</b> any child elements, including only any
+     Get the non-normalized, decoded text of this element, <b>not including</b> any child elements, including any
      newlines and spaces present in the original source.
      @return decoded, non-normalized text that is a direct child of this Element
      @see #text()
@@ -1706,10 +1728,10 @@ public Element val(String value) {
     /**
      Get the source range (start and end positions) of the end (closing) tag for this Element. Position tracking must be
      enabled prior to parsing the content.
-     @return the range of the closing tag for this element, if it was explicitly closed in the source. {@code Untracked}
-     otherwise.
+     @return the range of the closing tag for this element, or {@code untracked} if its range was not tracked.
      @see org.jsoup.parser.Parser#setTrackPosition(boolean)
      @see Node#sourceRange()
+     @see Range#isImplicit()
      @since 1.15.2
      */
     public Range endSourceRange() {
@@ -1799,7 +1821,9 @@ public Element clone() {
     @Override
     public Element shallowClone() {
         // simpler than implementing a clone version with no child copy
-        return new Element(tag, baseUri(), attributes == null ? null : attributes.clone());
+        String baseUri = baseUri();
+        if (baseUri.isEmpty()) baseUri = null; // saves setting a blank internal attribute
+        return new Element(tag, baseUri, attributes == null ? null : attributes.clone());
     }
 
     @Override
@@ -1816,8 +1840,9 @@ protected Element doClone(@Nullable Node parent) {
     @Override
     public Element clearAttributes() {
         if (attributes != null) {
-            super.clearAttributes();
-            attributes = null;
+            super.clearAttributes(); // keeps internal attributes via iterator
+            if (attributes.size() == 0)
+                attributes = null; // only remove entirely if no internal attributes
         }
 
         return this;
@@ -1849,17 +1874,15 @@ public Element forEachNode(Consumer<? super Node> action) {
      @param action the function to perform on the element
      @return this Element, for chaining
      @see Node#forEachNode(Consumer)
+     @deprecated use {@link #stream()}.{@link Stream#forEach(Consumer) forEach(Consumer)} instead. (Removing this method
+     so Element can implement Iterable, which this signature conflicts with due to the non-void return.)
      */
+    @Deprecated
     public Element forEach(Consumer<? super Element> action) {
-        Validate.notNull(action);
-        NodeTraversor.traverse((node, depth) -> {
-            if (node instanceof Element)
-                action.accept((Element) node);
-        }, this);
+        stream().forEach(action);
         return this;
     }
 
-
     @Override
     public Element filter(NodeFilter nodeFilter) {
         return  (Element) super.filter(nodeFilter);
diff --git a/src/main/java/org/jsoup/nodes/Entities.java b/src/main/java/org/jsoup/nodes/Entities.java
index be447bceb9..3fb39a8070 100644
--- a/src/main/java/org/jsoup/nodes/Entities.java
+++ b/src/main/java/org/jsoup/nodes/Entities.java
@@ -6,8 +6,8 @@
 import org.jsoup.nodes.Document.OutputSettings;
 import org.jsoup.parser.CharacterReader;
 import org.jsoup.parser.Parser;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
 import java.io.IOException;
 import java.nio.charset.CharsetEncoder;
 import java.util.Arrays;
diff --git a/src/main/java/org/jsoup/nodes/LeafNode.java b/src/main/java/org/jsoup/nodes/LeafNode.java
index d4117a7342..8e5df5f07a 100644
--- a/src/main/java/org/jsoup/nodes/LeafNode.java
+++ b/src/main/java/org/jsoup/nodes/LeafNode.java
@@ -2,7 +2,10 @@
 
 import java.util.List;
 
-abstract class LeafNode extends Node {
+/**
+ A node that does not hold any children. E.g.: {@link TextNode}, {@link DataNode}, {@link Comment}.
+ */
+public abstract class LeafNode extends Node {
     Object value; // either a string value, or an attribute map (in the rare case multiple attributes are set)
 
     protected final boolean hasAttributes() {
diff --git a/src/main/java/org/jsoup/nodes/Node.java b/src/main/java/org/jsoup/nodes/Node.java
index 3c55690f3a..c84a6a0f69 100644
--- a/src/main/java/org/jsoup/nodes/Node.java
+++ b/src/main/java/org/jsoup/nodes/Node.java
@@ -6,8 +6,8 @@
 import org.jsoup.select.NodeFilter;
 import org.jsoup.select.NodeTraversor;
 import org.jsoup.select.NodeVisitor;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
 import java.io.IOException;
 import java.util.ArrayList;
 import java.util.Arrays;
@@ -16,9 +16,11 @@
 import java.util.LinkedList;
 import java.util.List;
 import java.util.function.Consumer;
+import java.util.stream.Stream;
 
 /**
- The base, abstract Node model. Elements, Documents, Comments etc are all Node instances.
+ The base, abstract Node model. {@link Element}, {@link Document}, {@link Comment}, {@link TextNode}, et al.,
+ are instances of Node.
 
  @author Jonathan Hedley, jonathan@hedley.net */
 public abstract class Node implements Cloneable {
@@ -66,7 +68,7 @@ public boolean hasParent() {
     /**
      * Get an attribute's value by its key. <b>Case insensitive</b>
      * <p>
-     * To get an absolute URL from an attribute that may be a relative URL, prefix the key with <code><b>abs</b></code>,
+     * To get an absolute URL from an attribute that may be a relative URL, prefix the key with <code><b>abs:</b></code>,
      * which is a shortcut to the {@link #absUrl} method.
      * </p>
      * E.g.:
@@ -225,7 +227,8 @@ public String absUrl(String attributeKey) {
     /**
      Get a child node by its 0-based index.
      @param index index of child node
-     @return the child node at this index. Throws a {@code IndexOutOfBoundsException} if the index is out of bounds.
+     @return the child node at this index.
+     @throws IndexOutOfBoundsException if the index is out of bounds.
      */
     public Node childNode(int index) {
         return ensureChildNodes().get(index);
@@ -593,7 +596,7 @@ public List<Node> siblingNodes() {
 
     /**
      Get this node's next sibling.
-     @return next sibling, or @{code null} if this is the last sibling
+     @return next sibling, or {@code null} if this is the last sibling
      */
     public @Nullable Node nextSibling() {
         if (parentNode == null)
@@ -682,12 +685,12 @@ public Node traverse(NodeVisitor nodeVisitor) {
      */
     public Node forEachNode(Consumer<? super Node> action) {
         Validate.notNull(action);
-        NodeTraversor.traverse((node, depth) -> action.accept(node), this);
+        nodeStream().forEach(action);
         return this;
     }
 
     /**
-     * Perform a depth-first filtering through this node and its descendants.
+     * Perform a depth-first filtered traversal through this node and its descendants.
      * @param nodeFilter the filter callbacks to perform on each node
      * @return this node, for chaining
      */
@@ -697,6 +700,27 @@ public Node filter(NodeFilter nodeFilter) {
         return this;
     }
 
+    /**
+     Returns a Stream of this Node and all of its descendant Nodes. The stream has document order.
+     @return a stream of all nodes.
+     @see Element#stream()
+     @since 1.17.1
+     */
+    public Stream<Node> nodeStream() {
+        return NodeUtils.stream(this, Node.class);
+    }
+
+    /**
+     Returns a Stream of this and descendant nodes, containing only nodes of the specified type, in document order.
+     @param type the type of Node to include in the stream
+     @return a stream of nodes filtered by type.
+     @see Element#stream()
+     @since 1.17.1
+     */
+    public <T extends Node> Stream<T> nodeStream(Class<T> type) {
+        return NodeUtils.stream(this, type);
+    }
+
     /**
      Get the outer HTML of this node. For example, on a {@code p} element, may return {@code <p>Para</p>}.
      @return outer HTML
@@ -734,11 +758,14 @@ public <T extends Appendable> T html(T appendable) {
     }
 
     /**
-     Get the source range (start and end positions) in the original input source that this node was parsed from. Position
-     tracking must be enabled prior to parsing the content. For an Element, this will be the positions of the start tag.
-     @return the range for the start of the node.
+     Get the source range (start and end positions) in the original input source from which this node was parsed.
+     Position tracking must be enabled prior to parsing the content. For an Element, this will be the positions of the
+     start tag.
+     @return the range for the start of the node, or {@code untracked} if its range was not tracked.
      @see org.jsoup.parser.Parser#setTrackPosition(boolean)
+     @see Range#isImplicit()
      @see Element#endSourceRange()
+     @see Attributes#sourceRange(String name)
      @since 1.15.2
      */
     public Range sourceRange() {
diff --git a/src/main/java/org/jsoup/nodes/NodeIterator.java b/src/main/java/org/jsoup/nodes/NodeIterator.java
new file mode 100644
index 0000000000..58f97a3df1
--- /dev/null
+++ b/src/main/java/org/jsoup/nodes/NodeIterator.java
@@ -0,0 +1,124 @@
+package org.jsoup.nodes;
+
+import org.jsoup.helper.Validate;
+import org.jspecify.annotations.Nullable;
+
+import java.util.Iterator;
+import java.util.NoSuchElementException;
+
+/**
+ Iterates through a Node and its tree of descendants, in document order, returning nodes of the specified type. This
+ iterator supports structural changes to the tree during the traversal, such as {@link Node#remove()},
+ {@link Node#replaceWith(Node)}, {@link Node#wrap(String)}, etc.
+ <p>See also the {@link org.jsoup.select.NodeTraversor NodeTraversor} if {@code head} and {@code tail} callbacks are
+ desired for each node.</p>
+ @since 1.17.1
+ */
+public class NodeIterator<T extends Node> implements Iterator<T> {
+    private Node root;                      // root / starting node
+    private @Nullable T next;               // the next node to return
+    private Node current;                   // the current (last emitted) node
+    private Node previous;                  // the previously emitted node; used to recover from structural changes
+    private @Nullable Node currentParent;   // the current node's parent; used to detect structural changes
+    private final Class<T> type;            // the desired node class type
+
+    /**
+     Create a NodeIterator that will iterate the supplied node, and all of its descendants. The returned {@link #next}
+     type will be filtered to the input type.
+     * @param start initial node
+     * @param type node type to filter for
+     */
+    public NodeIterator(Node start, Class<T> type) {
+        Validate.notNull(start);
+        Validate.notNull(type);
+        this.type = type;
+
+        restart(start);
+    }
+
+    /**
+     Create a NodeIterator that will iterate the supplied node, and all of its descendants. All node types will be
+     returned.
+     * @param start initial node
+     */
+    public static NodeIterator<Node> from(Node start) {
+        return new NodeIterator<>(start, Node.class);
+    }
+
+    /**
+     Restart this Iterator from the specified start node. Will act as if it were newly constructed. Useful e.g. to
+     save some GC if the iterator is used in a tight loop.
+     * @param start the new start node.
+     */
+    public void restart(Node start) {
+        // always reassign next, so a lookahead left over from a previous traversal is not emitted after a restart
+        //noinspection unchecked
+        next = type.isInstance(start) ? (T) start : null; // first next() will be the start node, if of the desired type
+
+        root = previous = current = start;
+        currentParent = current.parent();
+    }
+
+    @Override public boolean hasNext() {
+        maybeFindNext();
+        return next != null;
+    }
+
+    @Override public T next() {
+        maybeFindNext();
+        if (next == null) throw new NoSuchElementException();
+
+        T result = next;
+        previous = current;
+        current = next;
+        currentParent = current.parent();
+        next = null;
+        return result;
+    }
+
+    /**
+     If next is null, looks for and sets next. If next is still null after this, we have reached the end.
+     */
+    private void maybeFindNext() {
+        if (next != null) return;
+
+        //  change detected (removed or replaced), redo from previous
+        if (currentParent != null && !current.hasParent())
+            current = previous;
+
+        next = findNextNode();
+    }
+
+    private @Nullable T findNextNode() {
+        Node node = current;
+        while (true) {
+            if (node.childNodeSize() > 0)
+                node = node.childNode(0);                   // descend children
+            else if (root.equals(node))
+                node = null;                                // complete when all children of root are fully visited
+            else if (node.nextSibling() != null)
+                node = node.nextSibling();                  // in a descendant with no more children; traverse
+            else {
+                while (true) {
+                    node = node.parent();                   // pop out of descendants
+                    if (node == null || root.equals(node))
+                        return null;                        // got back to root; complete
+                    if (node.nextSibling() != null) {
+                        node = node.nextSibling();          // traverse
+                        break;
+                    }
+                }
+            }
+            if (node == null)
+                return null;                                // reached the end
+
+            if (type.isInstance(node))
+                //noinspection unchecked
+                return (T) node;
+        }
+    }
+
+    @Override public void remove() {
+        current.remove(); // detaches the last emitted node; maybeFindNext() then resumes the walk from previous
+    }
+}
diff --git a/src/main/java/org/jsoup/nodes/NodeUtils.java b/src/main/java/org/jsoup/nodes/NodeUtils.java
index 4bd7e019ac..6d3bb814ab 100644
--- a/src/main/java/org/jsoup/nodes/NodeUtils.java
+++ b/src/main/java/org/jsoup/nodes/NodeUtils.java
@@ -6,7 +6,12 @@
 import org.jsoup.parser.Parser;
 import org.w3c.dom.NodeList;
 
+import java.util.Iterator;
 import java.util.List;
+import java.util.Spliterator;
+import java.util.Spliterators;
+import java.util.stream.Stream;
+import java.util.stream.StreamSupport;
 
 /**
  * Internal helpers for Nodes, to keep the actual node APIs relatively clean. A jsoup internal class, so don't use it as
@@ -47,4 +52,18 @@ static <T extends Node> List<T> selectXpath(String xpath, Element el, Class<T> n
         NodeList nodeList = w3c.selectXpath(xpath, contextNode);
         return w3c.sourceNodes(nodeList, nodeType);
     }
+
+    /** Creates a Stream, starting with the supplied node. */
+    static <T extends Node> Stream<T> stream(Node start, Class<T> type) {
+        NodeIterator<T> iterator = new NodeIterator<>(start, type);
+        Spliterator<T> spliterator = spliterator(iterator);
+
+        return StreamSupport.stream(spliterator, false);
+    }
+
+    static <T extends Node> Spliterator<T> spliterator(Iterator<T> iterator) {
+        return Spliterators.spliteratorUnknownSize(
+                iterator,
+                Spliterator.DISTINCT | Spliterator.NONNULL | Spliterator.ORDERED);
+    }
 }
diff --git a/src/main/java/org/jsoup/nodes/Range.java b/src/main/java/org/jsoup/nodes/Range.java
index d110d4c8d2..955c043a8c 100644
--- a/src/main/java/org/jsoup/nodes/Range.java
+++ b/src/main/java/org/jsoup/nodes/Range.java
@@ -1,6 +1,6 @@
 package org.jsoup.nodes;
 
-import org.jsoup.helper.Validate;
+import static org.jsoup.internal.SharedConstants.*;
 
 /**
  A Range object tracks the character positions in the original input source where a Node starts or ends. If you want to
@@ -10,12 +10,11 @@
  @since 1.15.2
  */
 public class Range {
+    private static final Position UntrackedPos = new Position(-1, -1, -1);
     private final Position start, end;
 
-    private static final String RangeKey = Attributes.internalKey("jsoup.sourceRange");
-    private static final String EndRangeKey = Attributes.internalKey("jsoup.endSourceRange");
-    private static final Position UntrackedPos = new Position(-1, -1, -1);
-    private static final Range Untracked = new Range(UntrackedPos, UntrackedPos);
+    /** An untracked source range. */
+    static final Range Untracked = new Range(UntrackedPos, UntrackedPos);
 
     /**
      Creates a new Range with start and end Positions. Called by TreeBuilder when position tracking is on.
@@ -35,6 +34,15 @@ public Position start() {
         return start;
     }
 
+    /**
+     Get the starting cursor position of this range.
+     @return the 0-based start cursor position.
+     @since 1.17.1
+     */
+    public int startPos() {
+        return start.pos;
+    }
+
     /**
      Get the end position of this node.
      * @return the end position
@@ -43,6 +51,15 @@ public Position end() {
         return end;
     }
 
+    /**
+     Get the ending cursor position of this range.
+     @return the 0-based ending cursor position.
+     @since 1.17.1
+     */
+    public int endPos() {
+        return end.pos;
+    }
+
     /**
      Test if this source range was tracked during parsing.
      * @return true if this was tracked during parsing, false otherwise (and all fields will be {@code -1}).
@@ -51,6 +68,20 @@ public boolean isTracked() {
         return this != Untracked;
     }
 
+    /**
+     Checks if the range represents a node that was implicitly created / closed.
+     <p>For example, with HTML of {@code <p>One<p>Two}, both {@code p} elements will have an explicit
+     {@link Element#sourceRange()} but an implicit {@link Element#endSourceRange()} marking the end position, as neither
+     have closing {@code </p>} tags. The TextNodes will have explicit sourceRanges.
+     <p>A range is considered implicit if its start and end positions are the same.
+     @return true if the range is tracked and its start and end positions are the same, false otherwise.
+     @since 1.17.1
+     */
+    public boolean isImplicit() {
+        if (!isTracked()) return false;
+        return start.equals(end);
+    }
+
     /**
      Retrieves the source range for a given Node.
      * @param node the node to retrieve the position for
@@ -59,20 +90,16 @@ public boolean isTracked() {
      */
     static Range of(Node node, boolean start) {
         final String key = start ? RangeKey : EndRangeKey;
-        if (!node.hasAttr(key))
-            return Untracked;
-        else
-            return (Range) Validate.ensureNotNull(node.attributes().getUserData(key));
+        if (!node.hasAttributes()) return Untracked;
+        Object range = node.attributes().userData(key);
+        return range != null ? (Range) range : Untracked;
     }
 
     /**
-     Internal jsoup method, called by the TreeBuilder. Tracks a Range for a Node.
-     * @param node the node to associate this position to
-     * @param start if this is the starting range. {@code false} for Element end tags.
+     @deprecated no-op; internal method moved out of visibility
      */
-    public void track(Node node, boolean start) {
-        node.attributes().putUserData(start ? RangeKey : EndRangeKey, this);
-    }
+    @Deprecated
+    public void track(Node node, boolean start) {}
 
     @Override
     public boolean equals(Object o) {
@@ -124,7 +151,7 @@ public Position(int pos, int lineNumber, int columnNumber) {
 
         /**
          Gets the position index (0-based) of the original input source that this Position was read at. This tracks the
-         total number of characters read into the source at this position, regardless of the number of preceeding lines.
+         total number of characters read into the source at this position, regardless of the number of preceding lines.
          * @return the position, or {@code -1} if untracked.
          */
         public int pos() {
@@ -182,6 +209,51 @@ public int hashCode() {
             result = 31 * result + columnNumber;
             return result;
         }
+    }
+
+    public static class AttributeRange {
+        static final AttributeRange UntrackedAttr = new AttributeRange(Range.Untracked, Range.Untracked);
 
+        private final Range nameRange;
+        private final Range valueRange;
+
+        /** Creates a new AttributeRange. Called during parsing by Token.StartTag. */
+        public AttributeRange(Range nameRange, Range valueRange) {
+            this.nameRange = nameRange;
+            this.valueRange = valueRange;
+        }
+
+        /** Get the source range for the attribute's name. */
+        public Range nameRange() {
+            return nameRange;
+        }
+
+        /** Get the source range for the attribute's value. */
+        public Range valueRange() {
+            return valueRange;
+        }
+
+        /** Get a String representation of this Attribute range, in the form
+         {@code line,column:pos-line,column:pos=line,column:pos-line,column:pos} (name start - name end = val start - val end).
+         */
+        @Override public String toString() {
+            return nameRange().toString() + "=" + valueRange().toString();
+        }
+
+        @Override public boolean equals(Object o) {
+            if (this == o) return true;
+            if (o == null || getClass() != o.getClass()) return false;
+
+            AttributeRange that = (AttributeRange) o;
+
+            if (!nameRange.equals(that.nameRange)) return false;
+            return valueRange.equals(that.valueRange);
+        }
+
+        @Override public int hashCode() {
+            int result = nameRange.hashCode();
+            result = 31 * result + valueRange.hashCode();
+            return result;
+        }
     }
 }
diff --git a/src/main/java/org/jsoup/nodes/package-info.java b/src/main/java/org/jsoup/nodes/package-info.java
index 7e66d2cab8..9a7214ffd6 100644
--- a/src/main/java/org/jsoup/nodes/package-info.java
+++ b/src/main/java/org/jsoup/nodes/package-info.java
@@ -1,7 +1,7 @@
 /**
  HTML document structure nodes.
  */
-@NonnullByDefault
+@NullMarked
 package org.jsoup.nodes;
 
-import org.jsoup.internal.NonnullByDefault;
+import org.jspecify.annotations.NullMarked;
diff --git a/src/main/java/org/jsoup/package-info.java b/src/main/java/org/jsoup/package-info.java
index 835aafbae5..036be0070b 100644
--- a/src/main/java/org/jsoup/package-info.java
+++ b/src/main/java/org/jsoup/package-info.java
@@ -1,7 +1,7 @@
 /**
  Contains the main {@link org.jsoup.Jsoup} class, which provides convenient static access to the jsoup functionality.
  */
-@NonnullByDefault
+@NullMarked
 package org.jsoup;
 
-import org.jsoup.internal.NonnullByDefault;
+import org.jspecify.annotations.NullMarked;
diff --git a/src/main/java/org/jsoup/parser/CharacterReader.java b/src/main/java/org/jsoup/parser/CharacterReader.java
index 1d00ec6ffb..d2fc46601c 100644
--- a/src/main/java/org/jsoup/parser/CharacterReader.java
+++ b/src/main/java/org/jsoup/parser/CharacterReader.java
@@ -2,8 +2,8 @@
 
 import org.jsoup.UncheckedIOException;
 import org.jsoup.helper.Validate;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
 import java.io.IOException;
 import java.io.Reader;
 import java.io.StringReader;
@@ -190,13 +190,13 @@ int columnNumber(int pos) {
     }
 
     /**
-     Get a formatted string representing the current line and cursor positions. E.g. <code>5:10</code> indicating line
+     Get a formatted string representing the current line and column positions. E.g. <code>5:10</code> indicating line
      number 5 and column number 10.
      @return line:col position
      @since 1.14.3
      @see #trackNewlines(boolean)
      */
-    String cursorPos() {
+    String posLineCol() {
         return lineNumber() + ":" + columnNumber();
     }
 
@@ -451,11 +451,12 @@ String consumeAttributeQuoted(final boolean single) {
                     break OUTER;
                 case '\'':
                     if (single) break OUTER;
+                    break;
                 case '"':
                     if (!single) break OUTER;
-                default:
-                    pos++;
+                    break;
             }
+            pos++;
         }
         bufPos = pos;
         return pos > start ? cacheString(charBuf, stringCache, start, pos -start) : "";
diff --git a/src/main/java/org/jsoup/parser/HtmlTreeBuilder.java b/src/main/java/org/jsoup/parser/HtmlTreeBuilder.java
index e29051ba27..b0fc8f3f62 100644
--- a/src/main/java/org/jsoup/parser/HtmlTreeBuilder.java
+++ b/src/main/java/org/jsoup/parser/HtmlTreeBuilder.java
@@ -3,6 +3,7 @@
 import org.jsoup.helper.Validate;
 import org.jsoup.internal.Normalizer;
 import org.jsoup.internal.StringUtil;
+import org.jsoup.nodes.Attributes;
 import org.jsoup.nodes.CDataNode;
 import org.jsoup.nodes.Comment;
 import org.jsoup.nodes.DataNode;
@@ -11,10 +12,8 @@
 import org.jsoup.nodes.FormElement;
 import org.jsoup.nodes.Node;
 import org.jsoup.nodes.TextNode;
-import org.jsoup.parser.Token.StartTag;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
-import javax.annotation.ParametersAreNonnullByDefault;
 import java.io.Reader;
 import java.io.StringReader;
 import java.util.ArrayList;
@@ -66,7 +65,7 @@ public class HtmlTreeBuilder extends TreeBuilder {
     private boolean fosterInserts; // if next inserts should be fostered
     private boolean fragmentParsing; // if parsing a fragment of html
 
-    ParseSettings defaultSettings() {
+    @Override ParseSettings defaultSettings() {
         return ParseSettings.htmlDefault;
     }
 
@@ -75,7 +74,7 @@ HtmlTreeBuilder newInstance() {
         return new HtmlTreeBuilder();
     }
 
-    @Override @ParametersAreNonnullByDefault
+    @Override
     protected void initialiseParse(Reader input, String baseUri, Parser parser) {
         super.initialiseParse(input, baseUri, parser);
 
@@ -95,7 +94,7 @@ protected void initialiseParse(Reader input, String baseUri, Parser parser) {
         fragmentParsing = false;
     }
 
-    List<Node> parseFragment(String inputFragment, @Nullable Element context, String baseUri, Parser parser) {
+    @Override List<Node> parseFragment(String inputFragment, @Nullable Element context, String baseUri, Parser parser) {
         // context may be null
         state = HtmlTreeBuilderState.Initial;
         initialiseParse(new StringReader(inputFragment), baseUri, parser);
@@ -136,7 +135,7 @@ List<Node> parseFragment(String inputFragment, @Nullable Element context, String
             }
             root = new Element(tagFor(contextTag, settings), baseUri);
             doc.appendChild(root);
-            stack.add(root);
+            push(root);
             resetInsertionMode();
 
             // setup form element to nearest form on context (up ancestor chain). ensures form controls are associated
@@ -166,16 +165,11 @@ List<Node> parseFragment(String inputFragment, @Nullable Element context, String
 
     @Override
     protected boolean process(Token token) {
-        currentToken = token;
-
-    if (shouldDispatchToCurrentInsertionMode(token)) {
-            return this.state.process(token, this);
-        } else {
-            return ForeignContent.process(token, this);
-        }
+        HtmlTreeBuilderState dispatch = useCurrentOrForeignInsert(token) ? this.state : ForeignContent;
+        return dispatch.process(token, this);
     }
 
-    boolean shouldDispatchToCurrentInsertionMode(Token token) {
+    boolean useCurrentOrForeignInsert(Token token) {
         // https://html.spec.whatwg.org/multipage/parsing.html#tree-construction
         // If the stack of open elements is empty
         if (stack.isEmpty())
@@ -214,7 +208,7 @@ boolean shouldDispatchToCurrentInsertionMode(Token token) {
         return token.isEOF();
     }
 
-    boolean isMathmlTextIntegration(Element el) {
+    static boolean isMathmlTextIntegration(Element el) {
         /*
         A node is a MathML text integration point if it is one of the following elements:
         A MathML mi element
@@ -227,7 +221,7 @@ boolean isMathmlTextIntegration(Element el) {
             && StringUtil.inSorted(el.normalName(), TagMathMlTextIntegration));
     }
 
-    boolean isHtmlIntegration(Element el) {
+    static boolean isHtmlIntegration(Element el) {
         /*
         A node is an HTML integration point if it is one of the following elements:
         A MathML annotation-xml element whose start tag token had an attribute with the name "encoding" whose value was an ASCII case-insensitive match for the string "text/html"
@@ -250,7 +244,6 @@ boolean isHtmlIntegration(Element el) {
     }
 
     boolean process(Token token, HtmlTreeBuilderState state) {
-        currentToken = token;
         return state.process(token, this);
     }
 
@@ -308,105 +301,122 @@ void error(HtmlTreeBuilderState state) {
                 currentToken.tokenType(), currentToken, state));
     }
 
+    Element createElementFor(Token.StartTag startTag, String namespace, boolean forcePreserveCase) {
+        // builds (but does not insert) the Element for a start tag. first normalize the attributes, then dedupe them:
+        Attributes attributes = startTag.attributes;
+        if (!forcePreserveCase) // case-preserving callers skip the settings-based normalization
+            attributes = settings.normalizeAttributes(attributes);
+        if (attributes != null && !attributes.isEmpty()) {
+            int dupes = attributes.deduplicate(settings);
+            if (dupes > 0) {
+                error("Dropped duplicate attribute(s) in tag [%s]", startTag.normalName);
+            }
+        }
+
+        Tag tag = tagFor(startTag.tagName, namespace,
+            forcePreserveCase ? ParseSettings.preserveCase : settings);
+
+        return (tag.normalName().equals("form")) ? // form tags get the FormElement subclass; all others a plain Element
+            new FormElement(tag, null, attributes) :
+            new Element(tag, null, attributes);
+    }
+
     /** Inserts an HTML element for the given tag) */
-    Element insert(final Token.StartTag startTag) {
-        dedupeAttributes(startTag);
+    Element insertElementFor(final Token.StartTag startTag) {
+        Element el = createElementFor(startTag, NamespaceHtml, false);
+        doInsertElement(el, startTag);
 
-        // handle empty unknown tags
-        // when the spec expects an empty tag, will directly hit insertEmpty, so won't generate this fake end tag.
+        // handle self-closing tags. when the spec expects an empty tag, will directly hit insertEmptyElementFor, so won't generate this fake end tag.
         if (startTag.isSelfClosing()) {
-            Element el = insertEmpty(startTag);
-            stack.add(el);
+            Tag tag = el.tag();
+            if (tag.isKnownTag()) {
+                if (!tag.isEmpty())
+                    tokeniser.error("Tag [%s] cannot be self closing; not a void tag", tag.normalName());
+                // else: ok
+            }
+            else { // unknown tag: remember this is self-closing, for output
+                tag.setSelfClosing();
+            }
+
+            // effectively a pop, but fiddles with the state. handles empty style, title etc which would otherwise leave us in data state
             tokeniser.transition(TokeniserState.Data); // handles <script />, otherwise needs breakout steps from script data
             tokeniser.emit(emptyEnd.reset().name(el.tagName()));  // ensure we get out of whatever state we are in. emitted for yielded processing
-            return el;
         }
 
-        Element el = new Element(tagFor(startTag.name(), settings), null, settings.normalizeAttributes(startTag.attributes));
-        insert(el, startTag);
         return el;
     }
 
     /**
      Inserts a foreign element. Preserves the case of the tag name and of the attributes.
      */
-    Element insertForeign(final Token.StartTag startTag, String namespace) {
-        dedupeAttributes(startTag);
-        Tag tag = tagFor(startTag.name(), namespace, ParseSettings.preserveCase);
-        Element el = new Element(tag, null, ParseSettings.preserveCase.normalizeAttributes(startTag.attributes));
-        insert(el, startTag);
+    Element insertForeignElementFor(final Token.StartTag startTag, String namespace) {
+        Element el = createElementFor(startTag, namespace, true);
+        doInsertElement(el, startTag);
 
         if (startTag.isSelfClosing()) {
-            tag.setSelfClosing(); // remember this is self-closing for output
+            el.tag().setSelfClosing(); // remember this is self-closing for output
             pop();
         }
 
         return el;
     }
 
-	Element insertStartTag(String startTagName) {
-        Element el = new Element(tagFor(startTagName, settings), null);
-        insert(el);
+    Element insertEmptyElementFor(Token.StartTag startTag) {
+        Element el = createElementFor(startTag, NamespaceHtml, false);
+        doInsertElement(el, startTag);
+        pop();
         return el;
     }
 
-    void insert(Element el) {
-        insertNode(el, null);
-        stack.add(el);
-    }
-
-    private void insert(Element el, @Nullable Token token) {
-        insertNode(el, token);
-        stack.add(el);
-    }
-
-    Element insertEmpty(Token.StartTag startTag) {
-        dedupeAttributes(startTag);
+    FormElement insertFormElement(Token.StartTag startTag, boolean onStack, boolean checkTemplateStack) {
+        FormElement el = (FormElement) createElementFor(startTag, NamespaceHtml, false);
 
-        Tag tag = tagFor(startTag.name(), settings);
-        Element el = new Element(tag, null, settings.normalizeAttributes(startTag.attributes));
-        insertNode(el, startTag);
-        if (startTag.isSelfClosing()) {
-            if (tag.isKnownTag()) {
-                if (!tag.isEmpty())
-                    tokeniser.error("Tag [%s] cannot be self closing; not a void tag", tag.normalName());
-            }
-            else // unknown tag, remember this is self-closing for output
-                tag.setSelfClosing();
-        }
-        return el;
-    }
-
-    FormElement insertForm(Token.StartTag startTag, boolean onStack, boolean checkTemplateStack) {
-        dedupeAttributes(startTag);
-
-        Tag tag = tagFor(startTag.name(), settings);
-        FormElement el = new FormElement(tag, null, settings.normalizeAttributes(startTag.attributes));
         if (checkTemplateStack) {
             if(!onStack("template"))
                 setFormElement(el);
         } else
             setFormElement(el);
 
-        insertNode(el, startTag);
-        if (onStack)
-            stack.add(el);
+        doInsertElement(el, startTag);
+        if (!onStack) pop();
         return el;
     }
 
-    void insert(Token.Comment commentToken) {
-        Comment comment = new Comment(commentToken.getData());
-        insertNode(comment, commentToken);
+    /** Appends the Element to the current element (or its foster parent), then pushes it onto the stack. All element
+     inserts must run through this method. Connects form-listed controls to the form and checks any xmlns attribute.
+     @param el the Element to insert and make the current element
+     @param token the token this element was parsed from, or null for an intrinsic insert. NOTE(review): not read in this body
+     */
+    private void doInsertElement(Element el, @Nullable Token token) {
+        if (el.tag().isFormListed() && formElement != null)
+            formElement.addElement(el); // connect form controls to their form element
+
+        // in HTML, the xmlns attribute if set must match what the parser set the tag's namespace to
+        if (el.hasAttr("xmlns") && !el.attr("xmlns").equals(el.tag().namespace()))
+            error("Invalid xmlns attribute [%s] on tag [%s]", el.attr("xmlns"), el.tagName());
+
+        if (isFosterInserts() && StringUtil.inSorted(currentElement().normalName(), InTableFoster))
+            insertInFosterParent(el);
+        else
+            currentElement().appendChild(el);
+
+        push(el);
+    }
+
+    void insertCommentNode(Token.Comment token) {
+        Comment node = new Comment(token.getData());
+        currentElement().appendChild(node);
+        onNodeInserted(node);
     }
 
     /** Inserts the provided character token into the current element. */
-    void insert(Token.Character characterToken) {
-        final Element el = currentElement(); // will be doc if no current element; allows for whitespace to be inserted into the doc root object (not on the stack)
-        insert(characterToken, el);
+    void insertCharacterNode(Token.Character characterToken) {
+        Element el = currentElement(); // will be doc if no current element; allows for whitespace to be inserted into the doc root object (not on the stack)
+        insertCharacterToElement(characterToken, el);
     }
 
     /** Inserts the provided character token into the provided element. */
-    void insert(Token.Character characterToken, Element el) {
+    void insertCharacterToElement(Token.Character characterToken, Element el) {
         final Node node;
         final String tagName = el.normalName();
         final String data = characterToken.getData();
@@ -418,48 +428,7 @@ else if (isContentForTagData(tagName))
         else
             node = new TextNode(data);
         el.appendChild(node); // doesn't use insertNode, because we don't foster these; and will always have a stack.
-        onNodeInserted(node, characterToken);
-    }
-
-    /** Inserts the provided Node into the current element. */
-    private void insertNode(Node node, @Nullable Token token) {
-        // if the stack hasn't been set up yet, elements (doctype, comments) go into the doc
-        if (stack.isEmpty())
-            doc.appendChild(node);
-        else if (isFosterInserts() && StringUtil.inSorted(currentElement().normalName(), InTableFoster))
-            insertInFosterParent(node);
-        else
-            currentElement().appendChild(node);
-
-        if (node instanceof Element) {
-            Element el = (Element) node;
-            if (el.tag().isFormListed() && formElement != null)
-                formElement.addElement(el); // connect form controls to their form element
-
-            // in HTML, the xmlns attribute if set must match what the parser set the tag's namespace to
-            if (el.hasAttr("xmlns") && !el.attr("xmlns").equals(el.tag().namespace()))
-                error("Invalid xmlns attribute [%s] on tag [%s]", el.attr("xmlns"), el.tagName());
-        }
-        onNodeInserted(node, token);
-    }
-
-    /** Cleanup duplicate attributes. **/
-    private void dedupeAttributes(StartTag startTag) {
-        if (startTag.hasAttributes() && !startTag.attributes.isEmpty()) {
-            int dupes = startTag.attributes.deduplicate(settings);
-            if (dupes > 0) {
-                error("Dropped duplicate attribute(s) in tag [%s]", startTag.normalName);
-            }
-        }
-    }
-
-    Element pop() {
-        int size = stack.size();
-        return stack.remove(size-1);
-    }
-
-    void push(Element element) {
-        stack.add(element);
+        onNodeInserted(node);
     }
 
     ArrayList<Element> getStack() {
@@ -507,6 +476,7 @@ boolean removeFromStack(Element el) {
             Element next = stack.get(pos);
             if (next == el) {
                 stack.remove(pos);
+                onNodeClosed(el);
                 return true;
             }
         }
@@ -517,11 +487,8 @@ boolean removeFromStack(Element el) {
     @Nullable
     Element popStackToClose(String elName) {
         for (int pos = stack.size() -1; pos >= 0; pos--) {
-            Element el = stack.get(pos);
-            stack.remove(pos);
+            Element el = pop();
             if (el.normalName().equals(elName) && NamespaceHtml.equals(el.tag().namespace())) {
-                if (currentToken instanceof Token.EndTag)
-                    onNodeClosed(el, currentToken);
                 return el;
             }
         }
@@ -532,11 +499,8 @@ Element popStackToClose(String elName) {
     @Nullable
     Element popStackToCloseAnyNamespace(String elName) {
         for (int pos = stack.size() -1; pos >= 0; pos--) {
-            Element el = stack.get(pos);
-            stack.remove(pos);
+            Element el = pop();
             if (el.normalName().equals(elName)) {
-                if (currentToken instanceof Token.EndTag)
-                    onNodeClosed(el, currentToken);
                 return el;
             }
         }
@@ -546,11 +510,8 @@ Element popStackToCloseAnyNamespace(String elName) {
     /** Pops the stack until one of the given HTML elements is removed. */
     void popStackToClose(String... elNames) { // elnames is sorted, comes from Constants
         for (int pos = stack.size() -1; pos >= 0; pos--) {
-            Element el = stack.get(pos);
-            stack.remove(pos);
+            Element el = pop();
             if (inSorted(el.normalName(), elNames) && NamespaceHtml.equals(el.tag().namespace())) {
-                if (currentToken instanceof Token.EndTag)
-                    onNodeClosed(el, currentToken);
                 break;
             }
         }
@@ -576,7 +537,7 @@ private void clearStackToContext(String... nodeNames) {
                 (StringUtil.in(next.normalName(), nodeNames) || next.normalName().equals("html")))
                 break;
             else
-                stack.remove(pos);
+                pop();
         }
     }
 
@@ -601,7 +562,7 @@ void replaceOnStack(Element out, Element in) {
         replaceInQueue(stack, out, in);
     }
 
-    private void replaceInQueue(ArrayList<Element> queue, Element out, Element in) {
+    private static void replaceInQueue(ArrayList<Element> queue, Element out, Element in) {
         int i = queue.lastIndexOf(out);
         Validate.isTrue(i != -1);
         queue.set(i, in);
@@ -695,13 +656,13 @@ boolean resetInsertionMode() {
     /** Places the body back onto the stack and moves to InBody, for cases in AfterBody / AfterAfterBody when more content comes */
     void resetBody() {
         if (!onStack("body")) {
-            stack.add(doc.body());
+            stack.add(doc.body()); // not onNodeInserted, as already seen
         }
         transition(HtmlTreeBuilderState.InBody);
     }
 
     // todo: tidy up in specific scope methods
-    private String[] specificScopeTarget = {null};
+    private final String[] specificScopeTarget = {null};
 
     private boolean inSpecificScope(String targetName, String[] baseTypes, String[] extraTypes) {
         specificScopeTarget[0] = targetName;
@@ -808,7 +769,7 @@ void setFormElement(FormElement formElement) {
     }
 
     void resetPendingTableCharacters() {
-        pendingTableCharacters = new ArrayList<>();
+        pendingTableCharacters.clear();
     }
 
     List<Token.Character> getPendingTableCharacters() {
@@ -862,7 +823,7 @@ void closeElement(String name) {
         popStackToClose(name);
     }
 
-    boolean isSpecial(Element el) {
+    static boolean isSpecial(Element el) {
         // todo: mathml's mi, mo, mn
         // todo: svg's foreigObject, desc, title
         String name = el.normalName();
@@ -925,7 +886,7 @@ void checkActiveFormattingElements(Element in){
         }
     }
 
-    private boolean isSameFormattingElement(Element a, Element b) {
+    private static boolean isSameFormattingElement(Element a, Element b) {
         // same if: same namespace, tag, and attributes. Element.equals only checks tag, might in future check children
         return a.normalName().equals(b.normalName()) &&
                 // a.namespace().equals(b.namespace()) &&
@@ -962,7 +923,7 @@ void reconstructFormattingElements() {
             // 8. create new element from element, 9 insert into current node, onto stack
             skip = false; // can only skip increment from 4.
             Element newEl = new Element(tagFor(entry.normalName(), settings), null, entry.attributes().clone());
-            insert(newEl);
+            doInsertElement(newEl, null);
 
             // 10. replace entry with new entry
             formattingElements.set(pos, newEl);
@@ -1068,7 +1029,7 @@ public String toString() {
                 '}';
     }
 
-    protected boolean isContentForTagData(final String normalName) {
+    @Override protected boolean isContentForTagData(final String normalName) {
         return (normalName.equals("script") || normalName.equals("style"));
     }
 }
diff --git a/src/main/java/org/jsoup/parser/HtmlTreeBuilderState.java b/src/main/java/org/jsoup/parser/HtmlTreeBuilderState.java
index fe0a9765bd..526619fc29 100644
--- a/src/main/java/org/jsoup/parser/HtmlTreeBuilderState.java
+++ b/src/main/java/org/jsoup/parser/HtmlTreeBuilderState.java
@@ -18,11 +18,11 @@
  */
 enum HtmlTreeBuilderState {
     Initial {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (isWhitespace(t)) {
                 return true; // ignore whitespace until we get the first content
             } else if (t.isComment()) {
-                tb.insert(t.asComment());
+                tb.insertCommentNode(t.asComment());
             } else if (t.isDoctype()) {
                 // todo: parse error check on expected doctypes
                 // todo: quirk state check on doctype ids
@@ -31,7 +31,7 @@ boolean process(Token t, HtmlTreeBuilder tb) {
                     tb.settings.normalizeTag(d.getName()), d.getPublicIdentifier(), d.getSystemIdentifier());
                 doctype.setPubSysKey(d.getPubSysKey());
                 tb.getDocument().appendChild(doctype);
-                tb.onNodeInserted(doctype, t);
+                tb.onNodeInserted(doctype);
                 if (d.isForceQuirks())
                     tb.getDocument().quirksMode(Document.QuirksMode.quirks);
                 tb.transition(BeforeHtml);
@@ -44,16 +44,16 @@ boolean process(Token t, HtmlTreeBuilder tb) {
         }
     },
     BeforeHtml {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (t.isDoctype()) {
                 tb.error(this);
                 return false;
             } else if (t.isComment()) {
-                tb.insert(t.asComment());
+                tb.insertCommentNode(t.asComment());
             } else if (isWhitespace(t)) {
-                tb.insert(t.asCharacter()); // out of spec - include whitespace
+                tb.insertCharacterNode(t.asCharacter()); // out of spec - include whitespace
             } else if (t.isStartTag() && t.asStartTag().normalName().equals("html")) {
-                tb.insert(t.asStartTag());
+                tb.insertElementFor(t.asStartTag());
                 tb.transition(BeforeHead);
             } else if (t.isEndTag() && (inSorted(t.asEndTag().normalName(), BeforeHtmlToHead))) {
                 return anythingElse(t, tb);
@@ -67,24 +67,24 @@ boolean process(Token t, HtmlTreeBuilder tb) {
         }
 
         private boolean anythingElse(Token t, HtmlTreeBuilder tb) {
-            tb.insertStartTag("html");
+            tb.processStartTag("html");
             tb.transition(BeforeHead);
             return tb.process(t);
         }
     },
     BeforeHead {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (isWhitespace(t)) {
-                tb.insert(t.asCharacter()); // out of spec - include whitespace
+                tb.insertCharacterNode(t.asCharacter()); // out of spec - include whitespace
             } else if (t.isComment()) {
-                tb.insert(t.asComment());
+                tb.insertCommentNode(t.asComment());
             } else if (t.isDoctype()) {
                 tb.error(this);
                 return false;
             } else if (t.isStartTag() && t.asStartTag().normalName().equals("html")) {
                 return InBody.process(t, tb); // does not transition
             } else if (t.isStartTag() && t.asStartTag().normalName().equals("head")) {
-                Element head = tb.insert(t.asStartTag());
+                Element head = tb.insertElementFor(t.asStartTag());
                 tb.setHeadElement(head);
                 tb.transition(InHead);
             } else if (t.isEndTag() && (inSorted(t.asEndTag().normalName(), BeforeHtmlToHead))) {
@@ -101,14 +101,14 @@ boolean process(Token t, HtmlTreeBuilder tb) {
         }
     },
     InHead {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (isWhitespace(t)) {
-                tb.insert(t.asCharacter()); // out of spec - include whitespace
+                tb.insertCharacterNode(t.asCharacter()); // out of spec - include whitespace
                 return true;
             }
             switch (t.type) {
                 case Comment:
-                    tb.insert(t.asComment());
+                    tb.insertCommentNode(t.asComment());
                     break;
                 case Doctype:
                     tb.error(this);
@@ -119,12 +119,12 @@ boolean process(Token t, HtmlTreeBuilder tb) {
                     if (name.equals("html")) {
                         return InBody.process(t, tb);
                     } else if (inSorted(name, InHeadEmpty)) {
-                        Element el = tb.insertEmpty(start);
+                        Element el = tb.insertEmptyElementFor(start);
                         // jsoup special: update base the first time it is seen
                         if (name.equals("base") && el.hasAttr("href"))
                             tb.maybeSetBaseUri(el);
                     } else if (name.equals("meta")) {
-                        tb.insertEmpty(start);
+                        tb.insertEmptyElementFor(start);
                         // todo: charset switches
                     } else if (name.equals("title")) {
                         handleRcData(start, tb);
@@ -132,19 +132,19 @@ boolean process(Token t, HtmlTreeBuilder tb) {
                         handleRawtext(start, tb);
                     } else if (name.equals("noscript")) {
                         // else if noscript && scripting flag = true: rawtext (jsoup doesn't run script, to handle as noscript)
-                        tb.insert(start);
+                        tb.insertElementFor(start);
                         tb.transition(InHeadNoscript);
                     } else if (name.equals("script")) {
                         // skips some script rules as won't execute them
                         tb.tokeniser.transition(TokeniserState.ScriptData);
                         tb.markInsertionMode();
                         tb.transition(Text);
-                        tb.insert(start);
+                        tb.insertElementFor(start);
                     } else if (name.equals("head")) {
                         tb.error(this);
                         return false;
                     } else if (name.equals("template")) {
-                        tb.insert(start);
+                        tb.insertElementFor(start);
                         tb.insertMarkerToFormattingElements();
                         tb.framesetOk(false);
                         tb.transition(InTemplate);
@@ -190,7 +190,7 @@ private boolean anythingElse(Token t, TreeBuilder tb) {
         }
     },
     InHeadNoscript {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (t.isDoctype()) {
                 tb.error(this);
             } else if (t.isStartTag() && t.asStartTag().normalName().equals("html")) {
@@ -217,16 +217,16 @@ private boolean anythingElse(Token t, HtmlTreeBuilder tb) {
             // https://html.spec.whatwg.org/multipage/parsing.html#parsing-main-inheadnoscript
             // allows content to be inserted as data
             tb.error(this);
-            tb.insert(new Token.Character().data(t.toString()));
+            tb.insertCharacterNode(new Token.Character().data(t.toString()));
             return true;
         }
     },
     AfterHead {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (isWhitespace(t)) {
-                tb.insert(t.asCharacter());
+                tb.insertCharacterNode(t.asCharacter());
             } else if (t.isComment()) {
-                tb.insert(t.asComment());
+                tb.insertCommentNode(t.asComment());
             } else if (t.isDoctype()) {
                 tb.error(this);
             } else if (t.isStartTag()) {
@@ -235,11 +235,11 @@ boolean process(Token t, HtmlTreeBuilder tb) {
                 if (name.equals("html")) {
                     return tb.process(t, InBody);
                 } else if (name.equals("body")) {
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     tb.framesetOk(false);
                     tb.transition(InBody);
                 } else if (name.equals("frameset")) {
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     tb.transition(InFrameset);
                 } else if (inSorted(name, InBodyStartToHead)) {
                     tb.error(this);
@@ -277,7 +277,7 @@ private boolean anythingElse(Token t, HtmlTreeBuilder tb) {
         }
     },
     InBody {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             switch (t.type) {
                 case Character: {
                     Token.Character c = t.asCharacter();
@@ -287,16 +287,16 @@ boolean process(Token t, HtmlTreeBuilder tb) {
                         return false;
                     } else if (tb.framesetOk() && isWhitespace(c)) { // don't check if whitespace if frames already closed
                         tb.reconstructFormattingElements();
-                        tb.insert(c);
+                        tb.insertCharacterNode(c);
                     } else {
                         tb.reconstructFormattingElements();
-                        tb.insert(c);
+                        tb.insertCharacterNode(c);
                         tb.framesetOk(false);
                     }
                     break;
                 }
                 case Comment: {
-                    tb.insert(t.asComment());
+                    tb.insertCommentNode(t.asComment());
                     break;
                 }
                 case Doctype: {
@@ -338,13 +338,13 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                         }
                     }
                     tb.reconstructFormattingElements();
-                    el = tb.insert(startTag);
+                    el = tb.insertElementFor(startTag);
                     tb.pushActiveFormattingElements(el);
                     break;
                 case "span":
                     // same as final else, but short circuits lots of checks
                     tb.reconstructFormattingElements();
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     break;
                 case "li":
                     tb.framesetOk(false);
@@ -355,13 +355,13 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                             tb.processEndTag("li");
                             break;
                         }
-                        if (tb.isSpecial(el) && !inSorted(el.normalName(), Constants.InBodyStartLiBreakers))
+                        if (HtmlTreeBuilder.isSpecial(el) && !inSorted(el.normalName(), Constants.InBodyStartLiBreakers))
                             break;
                     }
                     if (tb.inButtonScope("p")) {
                         tb.processEndTag("p");
                     }
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     break;
                 case "html":
                     tb.error(this);
@@ -411,7 +411,7 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                         // pop up to html element
                         while (stack.size() > 1)
                             stack.remove(stack.size() - 1);
-                        tb.insert(startTag);
+                        tb.insertElementFor(startTag);
                         tb.transition(InFrameset);
                     }
                     break;
@@ -423,13 +423,13 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                     if (tb.inButtonScope("p")) {
                         tb.closeElement("p");
                     }
-                    tb.insertForm(startTag, true, true); // won't associate to any template
+                    tb.insertFormElement(startTag, true, true); // won't associate to any template
                     break;
                 case "plaintext":
                     if (tb.inButtonScope("p")) {
                         tb.processEndTag("p");
                     }
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     tb.tokeniser.transition(TokeniserState.PLAINTEXT); // once in, never gets out
                     break;
                 case "button":
@@ -440,7 +440,7 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                         tb.process(startTag);
                     } else {
                         tb.reconstructFormattingElements();
-                        tb.insert(startTag);
+                        tb.insertElementFor(startTag);
                         tb.framesetOk(false);
                     }
                     break;
@@ -451,20 +451,20 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                         tb.processEndTag("nobr");
                         tb.reconstructFormattingElements();
                     }
-                    el = tb.insert(startTag);
+                    el = tb.insertElementFor(startTag);
                     tb.pushActiveFormattingElements(el);
                     break;
                 case "table":
                     if (tb.getDocument().quirksMode() != Document.QuirksMode.quirks && tb.inButtonScope("p")) {
                         tb.processEndTag("p");
                     }
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     tb.framesetOk(false);
                     tb.transition(InTable);
                     break;
                 case "input":
                     tb.reconstructFormattingElements();
-                    el = tb.insertEmpty(startTag);
+                    el = tb.insertEmptyElementFor(startTag);
                     if (!el.attr("type").equalsIgnoreCase("hidden"))
                         tb.framesetOk(false);
                     break;
@@ -472,14 +472,14 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                     if (tb.inButtonScope("p")) {
                         tb.processEndTag("p");
                     }
-                    tb.insertEmpty(startTag);
+                    tb.insertEmptyElementFor(startTag);
                     tb.framesetOk(false);
                     break;
                 case "image":
                     if (tb.getFromStack("svg") == null)
                         return tb.process(startTag.name("img")); // change <image> to <img>, unless in svg
                     else
-                        tb.insert(startTag);
+                        tb.insertElementFor(startTag);
                     break;
                 case "isindex":
                     // how much do we care about the early 90s?
@@ -519,7 +519,7 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                     tb.processEndTag("form");
                     break;
                 case "textarea":
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     if (!startTag.isSelfClosing()) {
                         tb.tokeniser.transition(TokeniserState.Rcdata);
                         tb.markInsertionMode();
@@ -545,7 +545,7 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                     break;
                 case "select":
                     tb.reconstructFormattingElements();
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     tb.framesetOk(false);
                     if (startTag.selfClosing) break; // don't change states if not added to the stack
 
@@ -557,11 +557,11 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                     break;
                 case "math":
                     tb.reconstructFormattingElements();
-                    tb.insertForeign(startTag, Parser.NamespaceMathml);
+                    tb.insertForeignElementFor(startTag, Parser.NamespaceMathml);
                     break;
                 case "svg":
                     tb.reconstructFormattingElements();
-                    tb.insertForeign(startTag, Parser.NamespaceSvg);
+                    tb.insertForeignElementFor(startTag, Parser.NamespaceSvg);
                     break;
                 // static final String[] Headings = new String[]{"h1", "h2", "h3", "h4", "h5", "h6"};
                 case "h1":
@@ -577,7 +577,7 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                         tb.error(this);
                         tb.pop();
                     }
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     break;
                 // static final String[] InBodyStartPreListing = new String[]{"listing", "pre"};
                 case "pre":
@@ -585,7 +585,7 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                     if (tb.inButtonScope("p")) {
                         tb.processEndTag("p");
                     }
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     tb.reader.matchConsume("\n"); // ignore LF if next token
                     tb.framesetOk(false);
                     break;
@@ -602,13 +602,13 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                             tb.processEndTag(el.normalName());
                             break;
                         }
-                        if (tb.isSpecial(el) && !inSorted(el.normalName(), Constants.InBodyStartLiBreakers))
+                        if (HtmlTreeBuilder.isSpecial(el) && !inSorted(el.normalName(), Constants.InBodyStartLiBreakers))
                             break;
                     }
                     if (tb.inButtonScope("p")) {
                         tb.processEndTag("p");
                     }
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     break;
 
                 case "optgroup":
@@ -616,7 +616,7 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                     if (tb.currentElementIs("option"))
                         tb.processEndTag("option");
                     tb.reconstructFormattingElements();
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     break;
 
                 case "rb":
@@ -626,7 +626,7 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                         if (!tb.currentElementIs("ruby"))
                             tb.error(this);
                     }
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     break;
 
                 case "rp":
@@ -636,7 +636,7 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                         if (!tb.currentElementIs("rtc") && !tb.currentElementIs("ruby"))
                             tb.error(this);
                     }
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     break;
 
                 // InBodyStartEmptyFormatters:
@@ -647,7 +647,7 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                 case "keygen":
                 case "wbr":
                     tb.reconstructFormattingElements();
-                    tb.insertEmpty(startTag);
+                    tb.insertEmptyElementFor(startTag);
                     tb.framesetOk(false);
                     break;
                 // Formatters:
@@ -664,33 +664,33 @@ private boolean inBodyStartTag(Token t, HtmlTreeBuilder tb) {
                 case "tt":
                 case "u":
                     tb.reconstructFormattingElements();
-                    el = tb.insert(startTag);
+                    el = tb.insertElementFor(startTag);
                     tb.pushActiveFormattingElements(el);
                     break;
                 default:
                     // todo - bring scan groups in if desired
                     if (!Tag.isKnownTag(name)) { // no special rules for custom tags
-                        tb.insert(startTag);
+                        tb.insertElementFor(startTag);
                     } else if (inSorted(name, Constants.InBodyStartPClosers)) {
                         if (tb.inButtonScope("p")) {
                             tb.processEndTag("p");
                         }
-                        tb.insert(startTag);
+                        tb.insertElementFor(startTag);
                     } else if (inSorted(name, Constants.InBodyStartToHead)) {
                         return tb.process(t, InHead);
                     } else if (inSorted(name, Constants.InBodyStartApplets)) {
                         tb.reconstructFormattingElements();
-                        tb.insert(startTag);
+                        tb.insertElementFor(startTag);
                         tb.insertMarkerToFormattingElements();
                         tb.framesetOk(false);
                     } else if (inSorted(name, Constants.InBodyStartMedia)) {
-                        tb.insertEmpty(startTag);
+                        tb.insertEmptyElementFor(startTag);
                     } else if (inSorted(name, Constants.InBodyStartDrop)) {
                         tb.error(this);
                         return false;
                     } else {
                         tb.reconstructFormattingElements();
-                        tb.insert(startTag);
+                        tb.insertElementFor(startTag);
                     }
             }
             return true;
@@ -727,6 +727,7 @@ private boolean inBodyEndTag(Token t, HtmlTreeBuilder tb) {
                     } else {
                         if (tb.onStackNot(InBodyEndOtherErrors))
                             tb.error(this);
+                        tb.onNodeClosed(tb.getFromStack("body")); // track source position of close; everything is still on stack in case of trailers
                         tb.transition(AfterBody);
                     }
                     break;
@@ -862,7 +863,7 @@ boolean anyOtherEndTag(Token t, HtmlTreeBuilder tb) {
                     tb.popStackToClose(name);
                     break;
                 } else {
-                    if (tb.isSpecial(node)) {
+                    if (HtmlTreeBuilder.isSpecial(node)) {
                         tb.error(this);
                         return false;
                     }
@@ -906,7 +907,7 @@ else if (!tb.onStack(formatEl)) {
                         seenFormattingElement = true;
                         // Let a bookmark note the position of the formatting element in the list of active formatting elements relative to the elements on either side of it in the list.
                         bookmark = tb.positionOfElement(el);
-                    } else if (seenFormattingElement && tb.isSpecial(el)) {
+                    } else if (seenFormattingElement && HtmlTreeBuilder.isSpecial(el)) {
                         furthestBlock = el;
                         break;
                     }
@@ -973,9 +974,9 @@ else if (!tb.onStack(formatEl)) {
     },
     Text {
         // in script, style etc. normally treated as data tags
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (t.isCharacter()) {
-                tb.insert(t.asCharacter());
+                tb.insertCharacterNode(t.asCharacter());
             } else if (t.isEOF()) {
                 tb.error(this);
                 // if current node is script: already started
@@ -991,14 +992,14 @@ boolean process(Token t, HtmlTreeBuilder tb) {
         }
     },
     InTable {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (t.isCharacter() && inSorted(tb.currentElement().normalName(), InTableFoster)) {
                 tb.resetPendingTableCharacters();
                 tb.markInsertionMode();
                 tb.transition(InTableText);
                 return tb.process(t);
             } else if (t.isComment()) {
-                tb.insert(t.asComment());
+                tb.insertCommentNode(t.asComment());
                 return true;
             } else if (t.isDoctype()) {
                 tb.error(this);
@@ -1009,11 +1010,11 @@ boolean process(Token t, HtmlTreeBuilder tb) {
                 if (name.equals("caption")) {
                     tb.clearStackToTableContext();
                     tb.insertMarkerToFormattingElements();
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     tb.transition(InCaption);
                 } else if (name.equals("colgroup")) {
                     tb.clearStackToTableContext();
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     tb.transition(InColumnGroup);
                 } else if (name.equals("col")) {
                     tb.clearStackToTableContext();
@@ -1021,7 +1022,7 @@ boolean process(Token t, HtmlTreeBuilder tb) {
                     return tb.process(t);
                 } else if (inSorted(name, InTableToBody)) {
                     tb.clearStackToTableContext();
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     tb.transition(InTableBody);
                 } else if (inSorted(name, InTableAddBody)) {
                     tb.clearStackToTableContext();
@@ -1035,7 +1036,7 @@ boolean process(Token t, HtmlTreeBuilder tb) {
                         tb.popStackToClose(name);
                         if (!tb.resetInsertionMode()) {
                             // not per spec - but haven't transitioned out of table. so try something else
-                            tb.insert(startTag);
+                            tb.insertElementFor(startTag);
                             return true;
                         }
                         return tb.process(t);
@@ -1046,14 +1047,14 @@ boolean process(Token t, HtmlTreeBuilder tb) {
                     if (!(startTag.hasAttributes() && startTag.attributes.get("type").equalsIgnoreCase("hidden"))) {
                         return anythingElse(t, tb);
                     } else {
-                        tb.insertEmpty(startTag);
+                        tb.insertEmptyElementFor(startTag);
                     }
                 } else if (name.equals("form")) {
                     tb.error(this);
                     if (tb.getFormElement() != null || tb.onStack("template"))
                         return false;
                     else {
-                        tb.insertForm(startTag, false, false); // not added to stack. can associate to template
+                        tb.insertFormElement(startTag, false, false); // not added to stack. can associate to template
                     }
                 } else {
                     return anythingElse(t, tb);
@@ -1097,7 +1098,7 @@ boolean anythingElse(Token t, HtmlTreeBuilder tb) {
         }
     },
     InTableText {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (t.type == Token.TokenType.Character) {
                 Token.Character c = t.asCharacter();
                 if (c.getData().equals(nullString)) {
@@ -1107,8 +1108,11 @@ boolean process(Token t, HtmlTreeBuilder tb) {
                     tb.addPendingTableCharacters(c);
                 }
             } else {
+                // insert gathered table text into the correct element:
                 if (tb.getPendingTableCharacters().size() > 0) {
+                    final Token og = tb.currentToken; // update current token, so we can track cursor pos correctly
                     for (Token.Character c : tb.getPendingTableCharacters()) {
+                        tb.currentToken = c;
                         if (!isWhitespace(c)) {
                             // InTable anything else section:
                             tb.error(this);
@@ -1120,8 +1124,9 @@ boolean process(Token t, HtmlTreeBuilder tb) {
                                 tb.process(c, InBody);
                             }
                         } else
-                            tb.insert(c);
+                            tb.insertCharacterNode(c);
                     }
+                    tb.currentToken = og;
                     tb.resetPendingTableCharacters();
                 }
                 tb.transition(tb.originalState());
@@ -1131,7 +1136,7 @@ boolean process(Token t, HtmlTreeBuilder tb) {
         }
     },
     InCaption {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (t.isEndTag() && t.asEndTag().normalName().equals("caption")) {
                 Token.EndTag endTag = t.asEndTag();
                 String name = endTag.normalName();
@@ -1164,14 +1169,14 @@ boolean process(Token t, HtmlTreeBuilder tb) {
         }
     },
     InColumnGroup {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (isWhitespace(t)) {
-                tb.insert(t.asCharacter());
+                tb.insertCharacterNode(t.asCharacter());
                 return true;
             }
             switch (t.type) {
                 case Comment:
-                    tb.insert(t.asComment());
+                    tb.insertCommentNode(t.asComment());
                     break;
                 case Doctype:
                     tb.error(this);
@@ -1182,7 +1187,7 @@ boolean process(Token t, HtmlTreeBuilder tb) {
                         case "html":
                             return tb.process(t, InBody);
                         case "col":
-                            tb.insertEmpty(startTag);
+                            tb.insertEmptyElementFor(startTag);
                             break;
                         case "template":
                             tb.process(t, InHead);
@@ -1234,14 +1239,14 @@ private boolean anythingElse(Token t, HtmlTreeBuilder tb) {
         }
     },
     InTableBody {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             switch (t.type) {
                 case StartTag:
                     Token.StartTag startTag = t.asStartTag();
                     String name = startTag.normalName();
                     if (name.equals("tr")) {
                         tb.clearStackToTableBodyContext();
-                        tb.insert(startTag);
+                        tb.insertElementFor(startTag);
                         tb.transition(InRow);
                     } else if (inSorted(name, InCellNames)) {
                         tb.error(this);
@@ -1294,14 +1299,14 @@ private boolean anythingElse(Token t, HtmlTreeBuilder tb) {
         }
     },
     InRow {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (t.isStartTag()) {
                 Token.StartTag startTag = t.asStartTag();
                 String name = startTag.normalName();
 
                 if (inSorted(name, InCellNames)) { // th, th
                     tb.clearStackToTableRowContext();
-                    tb.insert(startTag);
+                    tb.insertElementFor(startTag);
                     tb.transition(InCell);
                     tb.insertMarkerToFormattingElements();
                 } else if (inSorted(name, InRowMissing)) { // "caption", "col", "colgroup", "tbody", "tfoot", "thead", "tr"
@@ -1367,7 +1372,7 @@ private boolean anythingElse(Token t, HtmlTreeBuilder tb) {
         }
     },
     InCell {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (t.isEndTag()) {
                 Token.EndTag endTag = t.asEndTag();
                 String name = endTag.normalName();
@@ -1423,7 +1428,7 @@ private void closeCell(HtmlTreeBuilder tb) {
         }
     },
     InSelect {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             switch (t.type) {
                 case Character:
                     Token.Character c = t.asCharacter();
@@ -1431,11 +1436,11 @@ boolean process(Token t, HtmlTreeBuilder tb) {
                         tb.error(this);
                         return false;
                     } else {
-                        tb.insert(c);
+                        tb.insertCharacterNode(c);
                     }
                     break;
                 case Comment:
-                    tb.insert(t.asComment());
+                    tb.insertCommentNode(t.asComment());
                     break;
                 case Doctype:
                     tb.error(this);
@@ -1448,13 +1453,13 @@ boolean process(Token t, HtmlTreeBuilder tb) {
                     else if (name.equals("option")) {
                         if (tb.currentElementIs("option"))
                             tb.processEndTag("option");
-                        tb.insert(start);
+                        tb.insertElementFor(start);
                     } else if (name.equals("optgroup")) {
                         if (tb.currentElementIs("option"))
                             tb.processEndTag("option"); // pop option and flow to pop optgroup
                         if (tb.currentElementIs("optgroup"))
                             tb.processEndTag("optgroup");
-                        tb.insert(start);
+                        tb.insertElementFor(start);
                     } else if (name.equals("select")) {
                         tb.error(this);
                         return tb.processEndTag("select");
@@ -1519,7 +1524,7 @@ private boolean anythingElse(Token t, HtmlTreeBuilder tb) {
         }
     },
     InSelectInTable {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (t.isStartTag() && inSorted(t.asStartTag().normalName(), InSelectTableEnd)) {
                 tb.error(this);
                 tb.popStackToClose("select");
@@ -1539,7 +1544,7 @@ boolean process(Token t, HtmlTreeBuilder tb) {
         }
     },
     InTemplate {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             final String name;
             switch (t.type) {
                 case Character:
@@ -1608,16 +1613,16 @@ else if (name.equals("col")) {
         }
     },
     AfterBody {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
+            Element html = tb.getFromStack("html");
             if (isWhitespace(t)) {
                 // spec deviation - currently body is still on stack, but we want this to go to the html node
-                Element html = tb.getFromStack("html");
                 if (html != null)
-                    tb.insert(t.asCharacter(), html);
+                    tb.insertCharacterToElement(t.asCharacter(), html);
                 else
                     tb.process(t, InBody); // will get into body
             } else if (t.isComment()) {
-                tb.insert(t.asComment()); // into html node
+                tb.insertCommentNode(t.asComment()); // into html node
             } else if (t.isDoctype()) {
                 tb.error(this);
                 return false;
@@ -1628,6 +1633,7 @@ boolean process(Token t, HtmlTreeBuilder tb) {
                     tb.error(this);
                     return false;
                 } else {
+                    if (html != null) tb.onNodeClosed(html); // track source position of close; everything is still on stack in case of trailers
                     tb.transition(AfterAfterBody);
                 }
             } else if (t.isEOF()) {
@@ -1641,11 +1647,11 @@ boolean process(Token t, HtmlTreeBuilder tb) {
         }
     },
     InFrameset {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (isWhitespace(t)) {
-                tb.insert(t.asCharacter());
+                tb.insertCharacterNode(t.asCharacter());
             } else if (t.isComment()) {
-                tb.insert(t.asComment());
+                tb.insertCommentNode(t.asComment());
             } else if (t.isDoctype()) {
                 tb.error(this);
                 return false;
@@ -1655,10 +1661,10 @@ boolean process(Token t, HtmlTreeBuilder tb) {
                     case "html":
                         return tb.process(start, InBody);
                     case "frameset":
-                        tb.insert(start);
+                        tb.insertElementFor(start);
                         break;
                     case "frame":
-                        tb.insertEmpty(start);
+                        tb.insertEmptyElementFor(start);
                         break;
                     case "noframes":
                         return tb.process(start, InHead);
@@ -1689,11 +1695,11 @@ boolean process(Token t, HtmlTreeBuilder tb) {
         }
     },
     AfterFrameset {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (isWhitespace(t)) {
-                tb.insert(t.asCharacter());
+                tb.insertCharacterNode(t.asCharacter());
             } else if (t.isComment()) {
-                tb.insert(t.asComment());
+                tb.insertCommentNode(t.asComment());
             } else if (t.isDoctype()) {
                 tb.error(this);
                 return false;
@@ -1713,15 +1719,15 @@ boolean process(Token t, HtmlTreeBuilder tb) {
         }
     },
     AfterAfterBody {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (t.isComment()) {
-                tb.insert(t.asComment());
+                tb.insertCommentNode(t.asComment());
             } else if (t.isDoctype() || (t.isStartTag() && t.asStartTag().normalName().equals("html"))) {
                 return tb.process(t, InBody);
             } else if (isWhitespace(t)) {
                 // spec deviation - body and html still on stack, but want this space to go after </html>
                 Element doc = tb.getDocument();
-                tb.insert(t.asCharacter(), doc);
+                tb.insertCharacterToElement(t.asCharacter(), doc);
             }else if (t.isEOF()) {
                 // nice work chuck
             } else {
@@ -1733,9 +1739,9 @@ boolean process(Token t, HtmlTreeBuilder tb) {
         }
     },
     AfterAfterFrameset {
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             if (t.isComment()) {
-                tb.insert(t.asComment());
+                tb.insertCommentNode(t.asComment());
             } else if (t.isDoctype() || isWhitespace(t) || (t.isStartTag() && t.asStartTag().normalName().equals("html"))) {
                 return tb.process(t, InBody);
             } else if (t.isEOF()) {
@@ -1751,21 +1757,21 @@ boolean process(Token t, HtmlTreeBuilder tb) {
     },
     ForeignContent {
         // https://html.spec.whatwg.org/multipage/parsing.html#parsing-main-inforeign
-        boolean process(Token t, HtmlTreeBuilder tb) {
+        @Override boolean process(Token t, HtmlTreeBuilder tb) {
             switch (t.type) {
                 case Character:
                     Token.Character c = t.asCharacter();
                     if (c.getData().equals(nullString))
                         tb.error(this);
                     else if (HtmlTreeBuilderState.isWhitespace(c))
-                        tb.insert(c);
+                        tb.insertCharacterNode(c);
                     else {
-                        tb.insert(c);
+                        tb.insertCharacterNode(c);
                         tb.framesetOk(false);
                     }
                     break;
                 case Comment:
-                    tb.insert(t.asComment());
+                    tb.insertCommentNode(t.asComment());
                     break;
                 case Doctype:
                     tb.error(this);
@@ -1782,7 +1788,7 @@ else if (HtmlTreeBuilderState.isWhitespace(c))
 
                     // Any other start:
                     // (whatwg says to fix up tag name and attribute case per a table - we will preserve original case instead)
-                    tb.insertForeign(start, tb.currentElement().tag().namespace());
+                    tb.insertForeignElementFor(start, tb.currentElement().tag().namespace());
                     // (self-closing handled in insert)
                     // if self-closing svg script -- level and execution elided
                     break;
@@ -1846,14 +1852,14 @@ private static void handleRcData(Token.StartTag startTag, HtmlTreeBuilder tb) {
         tb.tokeniser.transition(TokeniserState.Rcdata);
         tb.markInsertionMode();
         tb.transition(Text);
-        tb.insert(startTag);
+        tb.insertElementFor(startTag);
     }
 
     private static void handleRawtext(Token.StartTag startTag, HtmlTreeBuilder tb) {
         tb.tokeniser.transition(TokeniserState.Rawtext);
         tb.markInsertionMode();
         tb.transition(Text);
-        tb.insert(startTag);
+        tb.insertElementFor(startTag);
     }
 
     // lists of tags to search through
diff --git a/src/main/java/org/jsoup/parser/ParseError.java b/src/main/java/org/jsoup/parser/ParseError.java
index 7571aa4902..a82b78356b 100644
--- a/src/main/java/org/jsoup/parser/ParseError.java
+++ b/src/main/java/org/jsoup/parser/ParseError.java
@@ -4,19 +4,19 @@
  * A Parse Error records an error in the input HTML that occurs in either the tokenisation or the tree building phase.
  */
 public class ParseError {
-    private int pos;
-    private String cursorPos;
-    private String errorMsg;
+    private final int pos;
+    private final String cursorPos;
+    private final String errorMsg;
 
     ParseError(CharacterReader reader, String errorMsg) {
         pos = reader.pos();
-        cursorPos = reader.cursorPos();
+        cursorPos = reader.posLineCol();
         this.errorMsg = errorMsg;
     }
 
     ParseError(CharacterReader reader, String errorFormat, Object... args) {
         pos = reader.pos();
-        cursorPos = reader.cursorPos();
+        cursorPos = reader.posLineCol();
         this.errorMsg = String.format(errorFormat, args);
     }
 
diff --git a/src/main/java/org/jsoup/parser/ParseSettings.java b/src/main/java/org/jsoup/parser/ParseSettings.java
index 56ff672d05..aad82da0a9 100644
--- a/src/main/java/org/jsoup/parser/ParseSettings.java
+++ b/src/main/java/org/jsoup/parser/ParseSettings.java
@@ -1,7 +1,8 @@
 package org.jsoup.parser;
 
 import org.jsoup.nodes.Attributes;
-import javax.annotation.Nullable;
+import org.jspecify.annotations.Nullable;
+
 import static org.jsoup.internal.Normalizer.lowerCase;
 
 /**
diff --git a/src/main/java/org/jsoup/parser/Parser.java b/src/main/java/org/jsoup/parser/Parser.java
index 123ddc3f8d..7ae7f31cd1 100644
--- a/src/main/java/org/jsoup/parser/Parser.java
+++ b/src/main/java/org/jsoup/parser/Parser.java
@@ -245,7 +245,7 @@ public static Document parseBodyFragment(String bodyHtml, String baseUri) {
      * @return an unescaped string
      */
     public static String unescapeEntities(String string, boolean inAttribute) {
-        Tokeniser tokeniser = new Tokeniser(new CharacterReader(string), ParseErrorList.noTracking());
+        Tokeniser tokeniser = new Tokeniser(new CharacterReader(string), ParseErrorList.noTracking(), false);
         return tokeniser.unescapeEntities(inAttribute);
     }
 
diff --git a/src/main/java/org/jsoup/parser/Token.java b/src/main/java/org/jsoup/parser/Token.java
index 81ad3fb524..c813e5d889 100644
--- a/src/main/java/org/jsoup/parser/Token.java
+++ b/src/main/java/org/jsoup/parser/Token.java
@@ -2,8 +2,14 @@
 
 import org.jsoup.helper.Validate;
 import org.jsoup.nodes.Attributes;
+import org.jsoup.nodes.Range;
+import org.jspecify.annotations.Nullable;
+
+import java.util.HashMap;
+import java.util.Map;
+
+import static org.jsoup.internal.SharedConstants.*;
 
-import javax.annotation.Nullable;
 
 /**
  * Parse tokens for the Tokeniser.
@@ -102,37 +108,52 @@ public String toString() {
 
     static abstract class Tag extends Token {
         @Nullable protected String tagName;
-        @Nullable protected String normalName; // lc version of tag name, for case insensitive tree build
+        @Nullable protected String normalName; // lc version of tag name, for case-insensitive tree build
+        boolean selfClosing = false;
+        @Nullable Attributes attributes; // start tags get attributes on construction. End tags get attributes on first new attribute (but only for parser convenience, not used).
 
-        private final StringBuilder attrName = new StringBuilder(); // try to get attr names and vals in one shot, vs Builder
-        @Nullable private String attrNameS;
+        @Nullable private String attrName; // try to get attr names and vals in one shot, vs Builder
+        private final StringBuilder attrNameSb = new StringBuilder();
         private boolean hasAttrName = false;
 
-        private final StringBuilder attrValue = new StringBuilder();
-        @Nullable private String attrValueS;
+        @Nullable private String attrValue;
+        private final StringBuilder attrValueSb = new StringBuilder();
         private boolean hasAttrValue = false;
         private boolean hasEmptyAttrValue = false; // distinguish boolean attribute from empty string value
 
-        boolean selfClosing = false;
-        @Nullable Attributes attributes; // start tags get attributes on construction. End tags get attributes on first new attribute (but only for parser convenience, not used).
+        // attribute source range tracking
+        final boolean trackSource;
+        int attrNameStart, attrNameEnd, attrValStart, attrValEnd;
+
+        Tag(boolean trackSource) {
+            this.trackSource = trackSource;
+        }
 
         @Override
         Tag reset() {
             super.reset();
             tagName = null;
             normalName = null;
-            reset(attrName);
-            attrNameS = null;
-            hasAttrName = false;
-            reset(attrValue);
-            attrValueS = null;
-            hasEmptyAttrValue = false;
-            hasAttrValue = false;
             selfClosing = false;
             attributes = null;
+            resetPendingAttr();
             return this;
         }
 
+        private void resetPendingAttr() { // clears the in-progress attribute; called from reset() and at the end of newAttribute()
+            reset(attrNameSb);
+            attrName = null;
+            hasAttrName = false;
+
+            reset(attrValueSb);
+            attrValue = null;
+            hasEmptyAttrValue = false;
+            hasAttrValue = false;
+
+            if (trackSource) // positions are only maintained when source tracking is enabled
+                attrNameStart = attrNameEnd = attrValStart = attrValEnd = Unset; // Unset lets ensureAttrName / ensureAttrValue latch the start on the first append
+        }
+
         /* Limits runaway crafted HTML from spewing attributes and getting a little sluggish in ensureCapacity.
         Real-world HTML will P99 around 8 attributes, so plenty of headroom. Implemented here and not in the Attributes
         object so that API users can add more if ever required. */
@@ -144,28 +165,52 @@ final void newAttribute() {
 
             if (hasAttrName && attributes.size() < MaxAttributes) {
                 // the tokeniser has skipped whitespace control chars, but trimming could collapse to empty for other control codes, so verify here
-                String name = attrName.length() > 0 ? attrName.toString() : attrNameS;
+                String name = attrNameSb.length() > 0 ? attrNameSb.toString() : attrName;
                 name = name.trim();
                 if (name.length() > 0) {
                     String value;
                     if (hasAttrValue)
-                        value = attrValue.length() > 0 ? attrValue.toString() : attrValueS;
+                        value = attrValueSb.length() > 0 ? attrValueSb.toString() : attrValue;
                     else if (hasEmptyAttrValue)
                         value = "";
                     else
                         value = null;
-                    // note that we add, not put. So that the first is kept, and rest are deduped, once in a context where case sensitivity is known (the appropriate tree builder).
+                    // Note that we add, not put, so that the first occurrence is kept; the rest are deduped later, once in a context where case sensitivity is known and we can warn about duplicates.
                     attributes.add(name, value);
+
+                    trackAttributeRange(name);
                 }
             }
-            reset(attrName);
-            attrNameS = null;
-            hasAttrName = false;
-
-            reset(attrValue);
-            attrValueS = null;
-            hasAttrValue = false;
-            hasEmptyAttrValue = false;
+            resetPendingAttr();
+        }
+
+        private void trackAttributeRange(String name) { // records the source range of the attribute just added, keyed by its trimmed name
+            if (trackSource && isStartTag()) { // end tags are built with trackSource=false, and only StartTag holds a reader
+                final StartTag start = asStartTag();
+                final CharacterReader r = start.reader; // used below to resolve line / column numbers for each position
+                assert attributes != null;
+                //noinspection unchecked
+                Map<String, Range.AttributeRange> attrRanges =
+                    (Map<String, Range.AttributeRange>) attributes.userData(AttrRangeKey);
+                if (attrRanges == null) { // first tracked attribute on this tag: create the map and attach it to the attributes' user data
+                    attrRanges = new HashMap<>();
+                    attributes.userData(AttrRangeKey, attrRanges);
+                }
+                if (attrRanges.containsKey(name)) return; // dedupe ranges on case-sensitive name as we go (first occurrence wins); actual attributes get deduped later
+
+                // if there's no value (e.g. a boolean attribute, or an empty value flagged via hasEmptyAttrValue), use an empty value range positioned at the end of the name
+                if (!hasAttrValue) attrValStart = attrValEnd = attrNameEnd;
+
+                Range.AttributeRange range = new Range.AttributeRange(
+                    new Range( // name range: start and end positions, each with its line and column
+                        new Range.Position(attrNameStart, r.lineNumber(attrNameStart), r.columnNumber(attrNameStart)),
+                        new Range.Position(attrNameEnd, r.lineNumber(attrNameEnd), r.columnNumber(attrNameEnd))),
+                    new Range( // value range: start and end positions, each with its line and column
+                        new Range.Position(attrValStart, r.lineNumber(attrValStart), r.columnNumber(attrValStart)),
+                        new Range.Position(attrValEnd, r.lineNumber(attrValEnd), r.columnNumber(attrValEnd)))
+                );
+                attrRanges.put(name, range);
+            }
+        }
 
         final boolean hasAttributes() {
@@ -225,46 +270,41 @@ final void appendTagName(char append) {
             appendTagName(String.valueOf(append));
         }
 
-        final void appendAttributeName(String append) {
+        final void appendAttributeName(String append, int startPos, int endPos) {
             // might have null chars because we eat in one pass - need to replace with null replacement character
             append = append.replace(TokeniserState.nullChar, Tokeniser.replacementChar);
 
-            ensureAttrName();
-            if (attrName.length() == 0) {
-                attrNameS = append;
+            ensureAttrName(startPos, endPos);
+            if (attrNameSb.length() == 0) {
+                attrName = append;
             } else {
-                attrName.append(append);
+                attrNameSb.append(append);
             }
         }
 
-        final void appendAttributeName(char append) {
-            ensureAttrName();
-            attrName.append(append);
+        final void appendAttributeName(char append, int startPos, int endPos) {
+            ensureAttrName(startPos, endPos);
+            attrNameSb.append(append);
         }
 
-        final void appendAttributeValue(String append) {
-            ensureAttrValue();
-            if (attrValue.length() == 0) {
-                attrValueS = append;
+        final void appendAttributeValue(String append, int startPos, int endPos) {
+            ensureAttrValue(startPos, endPos);
+            if (attrValueSb.length() == 0) {
+                attrValue = append;
             } else {
-                attrValue.append(append);
+                attrValueSb.append(append);
             }
         }
 
-        final void appendAttributeValue(char append) {
-            ensureAttrValue();
-            attrValue.append(append);
-        }
-
-        final void appendAttributeValue(char[] append) {
-            ensureAttrValue();
-            attrValue.append(append);
+        final void appendAttributeValue(char append, int startPos, int endPos) {
+            ensureAttrValue(startPos, endPos);
+            attrValueSb.append(append);
         }
 
-        final void appendAttributeValue(int[] appendCodepoints) {
-            ensureAttrValue();
+        final void appendAttributeValue(int[] appendCodepoints, int startPos, int endPos) {
+            ensureAttrValue(startPos, endPos);
             for (int codepoint : appendCodepoints) {
-                attrValue.appendCodePoint(codepoint);
+                attrValueSb.appendCodePoint(codepoint);
             }
         }
         
@@ -272,21 +312,29 @@ final void setEmptyAttributeValue() {
             hasEmptyAttrValue = true;
         }
 
-        private void ensureAttrName() {
+        private void ensureAttrName(int startPos, int endPos) {
             hasAttrName = true;
             // if on second hit, we'll need to move to the builder
-            if (attrNameS != null) {
-                attrName.append(attrNameS);
-                attrNameS = null;
+            if (attrName != null) {
+                attrNameSb.append(attrName);
+                attrName = null;
+            }
+            if (trackSource) {
+                attrNameStart = attrNameStart > Unset ? attrNameStart : startPos; // latches to first
+                attrNameEnd = endPos;
             }
         }
 
-        private void ensureAttrValue() {
+        private void ensureAttrValue(int startPos, int endPos) {
             hasAttrValue = true;
             // if on second hit, we'll need to move to the builder
-            if (attrValueS != null) {
-                attrValue.append(attrValueS);
-                attrValueS = null;
+            if (attrValue != null) {
+                attrValueSb.append(attrValue);
+                attrValue = null;
+            }
+            if (trackSource) {
+                attrValStart = attrValStart > Unset ? attrValStart : startPos; // latches to first
+                attrValEnd = endPos;
             }
         }
 
@@ -295,9 +343,13 @@ private void ensureAttrValue() {
     }
 
     final static class StartTag extends Tag {
-        StartTag() {
-            super();
+        final CharacterReader reader;
+
+        // The reader is retained so that, when source tracking is enabled, line / column positions can be resolved for attribute Ranges.
+        StartTag(boolean trackSource, CharacterReader reader) {
+            super(trackSource);
             type = TokenType.StartTag;
+            this.reader = reader;
         }
 
         @Override
@@ -326,7 +378,7 @@ public String toString() {
 
     final static class EndTag extends Tag{
         EndTag() {
-            super();
+            super(false);
             type = TokenType.EndTag;
         }
 
@@ -358,7 +410,7 @@ String getData() {
             return dataS != null ? dataS : data.toString();
         }
 
-        final Comment append(String append) {
+        Comment append(String append) {
             ensureData();
             if (data.length() == 0) {
                 dataS = append;
@@ -368,7 +420,7 @@ final Comment append(String append) {
             return this;
         }
 
-        final Comment append(char append) {
+        Comment append(char append) {
             ensureData();
             data.append(append);
             return this;
diff --git a/src/main/java/org/jsoup/parser/Tokeniser.java b/src/main/java/org/jsoup/parser/Tokeniser.java
index be00b7f63c..e76ba0d741 100644
--- a/src/main/java/org/jsoup/parser/Tokeniser.java
+++ b/src/main/java/org/jsoup/parser/Tokeniser.java
@@ -3,8 +3,8 @@
 import org.jsoup.helper.Validate;
 import org.jsoup.internal.StringUtil;
 import org.jsoup.nodes.Entities;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
 import java.util.Arrays;
 
 /**
@@ -38,21 +38,22 @@ final class Tokeniser {
     private boolean isEmitPending = false;
     @Nullable private String charsString = null; // characters pending an emit. Will fall to charsBuilder if more than one
     private final StringBuilder charsBuilder = new StringBuilder(1024); // buffers characters to output as one token, if more than one emit per read
-    StringBuilder dataBuffer = new StringBuilder(1024); // buffers data looking for </script>
-
-    Token.StartTag startPending = new Token.StartTag();
-    Token.EndTag endPending = new Token.EndTag();
-    Token.Tag tagPending = startPending; // tag we are building up: start or end pending
-    Token.Character charPending = new Token.Character();
-    Token.Doctype doctypePending = new Token.Doctype(); // doctype building up
-    Token.Comment commentPending = new Token.Comment(); // comment building up
+    final StringBuilder dataBuffer = new StringBuilder(1024); // buffers data looking for </script>
+
+    final Token.StartTag startPending;
+    final Token.EndTag endPending = new Token.EndTag();
+    Token.Tag tagPending; // tag we are building up: start or end pending
+    final Token.Character charPending = new Token.Character();
+    final Token.Doctype doctypePending = new Token.Doctype(); // doctype building up
+    final Token.Comment commentPending = new Token.Comment(); // comment building up
     @Nullable private String lastStartTag; // the last start tag emitted, to test appropriate end tag
     @Nullable private String lastStartCloseSeq; // "</" + lastStartTag, so we can quickly check for that in RCData
 
     private static final int Unset = -1;
     private int markupStartPos, charStartPos = Unset; // reader pos at the start of markup / characters. updated on state transition
 
-    Tokeniser(CharacterReader reader, ParseErrorList errors) {
+    Tokeniser(CharacterReader reader, ParseErrorList errors, boolean trackSource) {
+        tagPending = startPending  = new Token.StartTag(trackSource, reader);
         this.reader = reader;
         this.errors = errors;
     }
@@ -329,7 +330,7 @@ void error(String errorMsg, Object... args) {
             errors.add(new ParseError(reader, errorMsg, args));
     }
 
-    boolean currentNodeInHtmlNS() {
+    static boolean currentNodeInHtmlNS() {
         // todo: implement namespaces correctly
         return true;
         // Element currentNode = currentNode();
diff --git a/src/main/java/org/jsoup/parser/TokeniserState.java b/src/main/java/org/jsoup/parser/TokeniserState.java
index f269fc626c..081b1525fb 100644
--- a/src/main/java/org/jsoup/parser/TokeniserState.java
+++ b/src/main/java/org/jsoup/parser/TokeniserState.java
@@ -8,7 +8,7 @@
 enum TokeniserState {
     Data {
         // in data state, gather characters until a character reference or tag is found
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             switch (r.current()) {
                 case '&':
                     t.advanceTransition(CharacterReferenceInData);
@@ -32,13 +32,13 @@ void read(Tokeniser t, CharacterReader r) {
     },
     CharacterReferenceInData {
         // from & in data
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             readCharRef(t, Data);
         }
     },
     Rcdata {
         /// handles data in title, textarea etc
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             switch (r.current()) {
                 case '&':
                     t.advanceTransition(CharacterReferenceInRcdata);
@@ -62,22 +62,22 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     CharacterReferenceInRcdata {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             readCharRef(t, Rcdata);
         }
     },
     Rawtext {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             readRawData(t, r, this, RawtextLessthanSign);
         }
     },
     ScriptData {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             readRawData(t, r, this, ScriptDataLessthanSign);
         }
     },
     PLAINTEXT {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             switch (r.current()) {
                 case nullChar:
                     t.error(this);
@@ -96,7 +96,7 @@ void read(Tokeniser t, CharacterReader r) {
     },
     TagOpen {
         // from < in data
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             switch (r.current()) {
                 case '!':
                     t.advanceTransition(MarkupDeclarationOpen);
@@ -122,7 +122,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     EndTagOpen {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             if (r.isEmpty()) {
                 t.eofError(this);
                 t.emit("</");
@@ -143,7 +143,7 @@ void read(Tokeniser t, CharacterReader r) {
     },
     TagName {
         // from < or </ in data, will have start or end tag pending
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             // previous TagOpen state did NOT consume, will have a letter char in current
             String tagName = r.consumeTagName();
             t.tagPending.appendTagName(tagName);
@@ -182,7 +182,7 @@ void read(Tokeniser t, CharacterReader r) {
     },
     RcdataLessthanSign {
         // from < in rcdata
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             if (r.matches('/')) {
                 t.createTempBuffer();
                 t.advanceTransition(RCDATAEndTagOpen);
@@ -199,7 +199,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     RCDATAEndTagOpen {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             if (r.matchesAsciiAlpha()) {
                 t.createTagPending(false);
                 t.tagPending.appendTagName(r.current());
@@ -212,7 +212,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     RCDATAEndTagName {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             if (r.matchesAsciiAlpha()) {
                 String name = r.consumeLetterSequence();
                 t.tagPending.appendTagName(name);
@@ -259,7 +259,7 @@ private void anythingElse(Tokeniser t, CharacterReader r) {
         }
     },
     RawtextLessthanSign {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             if (r.matches('/')) {
                 t.createTempBuffer();
                 t.advanceTransition(RawtextEndTagOpen);
@@ -270,17 +270,17 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     RawtextEndTagOpen {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             readEndTag(t, r, RawtextEndTagName, Rawtext);
         }
     },
     RawtextEndTagName {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             handleDataEndTag(t, r, Rawtext);
         }
     },
     ScriptDataLessthanSign {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             switch (r.consume()) {
                 case '/':
                     t.createTempBuffer();
@@ -303,17 +303,17 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     ScriptDataEndTagOpen {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             readEndTag(t, r, ScriptDataEndTagName, ScriptData);
         }
     },
     ScriptDataEndTagName {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             handleDataEndTag(t, r, ScriptData);
         }
     },
     ScriptDataEscapeStart {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             if (r.matches('-')) {
                 t.emit('-');
                 t.advanceTransition(ScriptDataEscapeStartDash);
@@ -323,7 +323,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     ScriptDataEscapeStartDash {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             if (r.matches('-')) {
                 t.emit('-');
                 t.advanceTransition(ScriptDataEscapedDashDash);
@@ -333,7 +333,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     ScriptDataEscaped {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             if (r.isEmpty()) {
                 t.eofError(this);
                 t.transition(Data);
@@ -360,7 +360,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     ScriptDataEscapedDash {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             if (r.isEmpty()) {
                 t.eofError(this);
                 t.transition(Data);
@@ -388,7 +388,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     ScriptDataEscapedDashDash {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             if (r.isEmpty()) {
                 t.eofError(this);
                 t.transition(Data);
@@ -419,7 +419,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     ScriptDataEscapedLessthanSign {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             if (r.matchesAsciiAlpha()) {
                 t.createTempBuffer();
                 t.dataBuffer.append(r.current());
@@ -436,7 +436,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     ScriptDataEscapedEndTagOpen {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             if (r.matchesAsciiAlpha()) {
                 t.createTagPending(false);
                 t.tagPending.appendTagName(r.current());
@@ -449,17 +449,17 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     ScriptDataEscapedEndTagName {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             handleDataEndTag(t, r, ScriptDataEscaped);
         }
     },
     ScriptDataDoubleEscapeStart {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             handleDataDoubleEscapeTag(t, r, ScriptDataDoubleEscaped, ScriptDataEscaped);
         }
     },
     ScriptDataDoubleEscaped {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.current();
             switch (c) {
                 case '-':
@@ -486,7 +486,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     ScriptDataDoubleEscapedDash {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '-':
@@ -513,7 +513,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     ScriptDataDoubleEscapedDashDash {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '-':
@@ -543,7 +543,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     ScriptDataDoubleEscapedLessthanSign {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             if (r.matches('/')) {
                 t.emit('/');
                 t.createTempBuffer();
@@ -554,13 +554,13 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     ScriptDataDoubleEscapeEnd {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             handleDataDoubleEscapeTag(t,r, ScriptDataEscaped, ScriptDataDoubleEscaped);
         }
     },
     BeforeAttributeName {
         // from tagname <xxx
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '\t':
@@ -595,7 +595,7 @@ void read(Tokeniser t, CharacterReader r) {
                 case '=':
                     t.error(this);
                     t.tagPending.newAttribute();
-                    t.tagPending.appendAttributeName(c);
+                    t.tagPending.appendAttributeName(c, r.pos()-1, r.pos());
                     t.transition(AttributeName);
                     break;
                 default: // A-Z, anything else
@@ -607,10 +607,12 @@ void read(Tokeniser t, CharacterReader r) {
     },
     AttributeName {
         // from before attribute name
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
+            int pos = r.pos();
             String name = r.consumeToAnySorted(attributeNameCharsSorted); // spec deviate - consume and emit nulls in one hit vs stepping
-            t.tagPending.appendAttributeName(name);
+            t.tagPending.appendAttributeName(name, pos, r.pos());
 
+            pos = r.pos();
             char c = r.consume();
             switch (c) {
                 case '\t':
@@ -638,15 +640,15 @@ void read(Tokeniser t, CharacterReader r) {
                 case '\'':
                 case '<':
                     t.error(this);
-                    t.tagPending.appendAttributeName(c);
+                    t.tagPending.appendAttributeName(c, pos, r.pos());
                     break;
                 default: // buffer underrun
-                    t.tagPending.appendAttributeName(c);
+                    t.tagPending.appendAttributeName(c, pos, r.pos());
             }
         }
     },
     AfterAttributeName {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '\t':
@@ -668,7 +670,7 @@ void read(Tokeniser t, CharacterReader r) {
                     break;
                 case nullChar:
                     t.error(this);
-                    t.tagPending.appendAttributeName(replacementChar);
+                    t.tagPending.appendAttributeName(replacementChar, r.pos()-1, r.pos());
                     t.transition(AttributeName);
                     break;
                 case eof:
@@ -680,7 +682,7 @@ void read(Tokeniser t, CharacterReader r) {
                 case '<':
                     t.error(this);
                     t.tagPending.newAttribute();
-                    t.tagPending.appendAttributeName(c);
+                    t.tagPending.appendAttributeName(c, r.pos()-1, r.pos());
                     t.transition(AttributeName);
                     break;
                 default: // A-Z, anything else
@@ -691,7 +693,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     BeforeAttributeValue {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '\t':
@@ -713,7 +715,7 @@ void read(Tokeniser t, CharacterReader r) {
                     break;
                 case nullChar:
                     t.error(this);
-                    t.tagPending.appendAttributeValue(replacementChar);
+                    t.tagPending.appendAttributeValue(replacementChar, r.pos()-1, r.pos());
                     t.transition(AttributeValue_unquoted);
                     break;
                 case eof:
@@ -730,7 +732,7 @@ void read(Tokeniser t, CharacterReader r) {
                 case '=':
                 case '`':
                     t.error(this);
-                    t.tagPending.appendAttributeValue(c);
+                    t.tagPending.appendAttributeValue(c, r.pos()-1, r.pos());
                     t.transition(AttributeValue_unquoted);
                     break;
                 default:
@@ -740,13 +742,15 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     AttributeValue_doubleQuoted {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
+            int pos = r.pos();
             String value = r.consumeAttributeQuoted(false);
             if (value.length() > 0)
-                t.tagPending.appendAttributeValue(value);
+                t.tagPending.appendAttributeValue(value, pos, r.pos());
             else
                 t.tagPending.setEmptyAttributeValue();
 
+            pos = r.pos();
             char c = r.consume();
             switch (c) {
                 case '"':
@@ -755,31 +759,33 @@ void read(Tokeniser t, CharacterReader r) {
                 case '&':
                     int[] ref = t.consumeCharacterReference('"', true);
                     if (ref != null)
-                        t.tagPending.appendAttributeValue(ref);
+                        t.tagPending.appendAttributeValue(ref, pos, r.pos());
                     else
-                        t.tagPending.appendAttributeValue('&');
+                        t.tagPending.appendAttributeValue('&', pos, r.pos());
                     break;
                 case nullChar:
                     t.error(this);
-                    t.tagPending.appendAttributeValue(replacementChar);
+                    t.tagPending.appendAttributeValue(replacementChar, pos, r.pos());
                     break;
                 case eof:
                     t.eofError(this);
                     t.transition(Data);
                     break;
                 default: // hit end of buffer in first read, still in attribute
-                    t.tagPending.appendAttributeValue(c);
+                    t.tagPending.appendAttributeValue(c, pos, r.pos());
             }
         }
     },
     AttributeValue_singleQuoted {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
+            int pos = r.pos();
             String value = r.consumeAttributeQuoted(true);
             if (value.length() > 0)
-                t.tagPending.appendAttributeValue(value);
+                t.tagPending.appendAttributeValue(value, pos, r.pos());
             else
                 t.tagPending.setEmptyAttributeValue();
 
+            pos = r.pos();
             char c = r.consume();
             switch (c) {
                 case '\'':
@@ -788,29 +794,31 @@ void read(Tokeniser t, CharacterReader r) {
                 case '&':
                     int[] ref = t.consumeCharacterReference('\'', true);
                     if (ref != null)
-                        t.tagPending.appendAttributeValue(ref);
+                        t.tagPending.appendAttributeValue(ref, pos, r.pos());
                     else
-                        t.tagPending.appendAttributeValue('&');
+                        t.tagPending.appendAttributeValue('&', pos, r.pos());
                     break;
                 case nullChar:
                     t.error(this);
-                    t.tagPending.appendAttributeValue(replacementChar);
+                    t.tagPending.appendAttributeValue(replacementChar, pos, r.pos());
                     break;
                 case eof:
                     t.eofError(this);
                     t.transition(Data);
                     break;
                 default: // hit end of buffer in first read, still in attribute
-                    t.tagPending.appendAttributeValue(c);
+                    t.tagPending.appendAttributeValue(c, pos, r.pos());
             }
         }
     },
     AttributeValue_unquoted {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
+            int pos = r.pos();
             String value = r.consumeToAnySorted(attributeValueUnquoted);
             if (value.length() > 0)
-                t.tagPending.appendAttributeValue(value);
+                t.tagPending.appendAttributeValue(value, pos, r.pos());
 
+            pos = r.pos();
             char c = r.consume();
             switch (c) {
                 case '\t':
@@ -823,9 +831,9 @@ void read(Tokeniser t, CharacterReader r) {
                 case '&':
                     int[] ref = t.consumeCharacterReference('>', true);
                     if (ref != null)
-                        t.tagPending.appendAttributeValue(ref);
+                        t.tagPending.appendAttributeValue(ref, pos, r.pos());
                     else
-                        t.tagPending.appendAttributeValue('&');
+                        t.tagPending.appendAttributeValue('&', pos, r.pos());
                     break;
                 case '>':
                     t.emitTagPending();
@@ -833,7 +841,7 @@ void read(Tokeniser t, CharacterReader r) {
                     break;
                 case nullChar:
                     t.error(this);
-                    t.tagPending.appendAttributeValue(replacementChar);
+                    t.tagPending.appendAttributeValue(replacementChar, pos, r.pos());
                     break;
                 case eof:
                     t.eofError(this);
@@ -845,17 +853,17 @@ void read(Tokeniser t, CharacterReader r) {
                 case '=':
                 case '`':
                     t.error(this);
-                    t.tagPending.appendAttributeValue(c);
+                    t.tagPending.appendAttributeValue(c, pos, r.pos());
                     break;
                 default: // hit end of buffer in first read, still in attribute
-                    t.tagPending.appendAttributeValue(c);
+                    t.tagPending.appendAttributeValue(c, pos, r.pos());
             }
 
         }
     },
     // CharacterReferenceInAttributeValue state handled inline
     AfterAttributeValue_quoted {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '\t':
@@ -885,7 +893,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     SelfClosingStartTag {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '>':
@@ -905,7 +913,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     BogusComment {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             // todo: handle bogus comment starting from eof. when does that trigger?
             t.commentPending.append(r.consumeTo('>'));
             // todo: replace nullChar with replaceChar
@@ -918,7 +926,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     MarkupDeclarationOpen {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             if (r.matchConsume("--")) {
                 t.createCommentPending();
                 t.transition(CommentStart);
@@ -938,7 +946,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     CommentStart {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '-':
@@ -966,7 +974,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     CommentStartDash {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '-':
@@ -994,7 +1002,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     Comment {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.current();
             switch (c) {
                 case '-':
@@ -1016,7 +1024,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     CommentEndDash {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '-':
@@ -1039,7 +1047,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     CommentEnd {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '>':
@@ -1069,7 +1077,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     CommentEndBang {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '-':
@@ -1097,7 +1105,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     Doctype {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '\t':
@@ -1124,7 +1132,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     BeforeDoctypeName {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             if (r.matchesAsciiAlpha()) {
                 t.createDoctypePending();
                 t.transition(DoctypeName);
@@ -1159,7 +1167,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     DoctypeName {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             if (r.matchesLetter()) {
                 String name = r.consumeLetterSequence();
                 t.doctypePending.name.append(name);
@@ -1194,7 +1202,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     AfterDoctypeName {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             if (r.isEmpty()) {
                 t.eofError(this);
                 t.doctypePending.forceQuirks = true;
@@ -1222,7 +1230,7 @@ else if (r.matches('>')) {
         }
     },
     AfterDoctypePublicKeyword {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '\t':
@@ -1262,7 +1270,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     BeforeDoctypePublicIdentifier {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '\t':
@@ -1299,7 +1307,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     DoctypePublicIdentifier_doubleQuoted {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '"':
@@ -1327,7 +1335,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     DoctypePublicIdentifier_singleQuoted {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '\'':
@@ -1355,7 +1363,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     AfterDoctypePublicIdentifier {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '\t':
@@ -1393,7 +1401,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     BetweenDoctypePublicAndSystemIdentifiers {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '\t':
@@ -1430,7 +1438,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     AfterDoctypeSystemKeyword {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '\t':
@@ -1470,7 +1478,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     BeforeDoctypeSystemIdentifier {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '\t':
@@ -1507,7 +1515,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     DoctypeSystemIdentifier_doubleQuoted {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '"':
@@ -1535,7 +1543,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     DoctypeSystemIdentifier_singleQuoted {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '\'':
@@ -1563,7 +1571,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     AfterDoctypeSystemIdentifier {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '\t':
@@ -1590,7 +1598,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     BogusDoctype {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             char c = r.consume();
             switch (c) {
                 case '>':
@@ -1608,7 +1616,7 @@ void read(Tokeniser t, CharacterReader r) {
         }
     },
     CdataSection {
-        void read(Tokeniser t, CharacterReader r) {
+        @Override void read(Tokeniser t, CharacterReader r) {
             String data = r.consumeTo("]]>");
             t.dataBuffer.append(data);
             if (r.matchConsume("]]>") || r.isEmpty()) {
diff --git a/src/main/java/org/jsoup/parser/TreeBuilder.java b/src/main/java/org/jsoup/parser/TreeBuilder.java
index 6c9a78b5bc..eadfa28447 100644
--- a/src/main/java/org/jsoup/parser/TreeBuilder.java
+++ b/src/main/java/org/jsoup/parser/TreeBuilder.java
@@ -1,14 +1,13 @@
 package org.jsoup.parser;
 
 import org.jsoup.helper.Validate;
+import org.jsoup.internal.SharedConstants;
 import org.jsoup.nodes.Attributes;
 import org.jsoup.nodes.Document;
 import org.jsoup.nodes.Element;
 import org.jsoup.nodes.Node;
 import org.jsoup.nodes.Range;
 
-import javax.annotation.Nullable;
-import javax.annotation.ParametersAreNonnullByDefault;
 import java.io.Reader;
 import java.util.ArrayList;
 import java.util.HashMap;
@@ -24,21 +23,20 @@ abstract class TreeBuilder {
     protected Parser parser;
     CharacterReader reader;
     Tokeniser tokeniser;
-    protected Document doc; // current doc we are building into
-    protected ArrayList<Element> stack; // the stack of open elements
-    protected String baseUri; // current base uri, for creating new elements
-    protected Token currentToken; // currentToken is used only for error tracking.
-    protected ParseSettings settings;
-    protected Map<String, Tag> seenTags; // tags we've used in this parse; saves tag GC for custom tags.
-
-    private Token.StartTag start = new Token.StartTag(); // start tag to process
-    private Token.EndTag end  = new Token.EndTag();
+    Document doc; // current doc we are building into
+    ArrayList<Element> stack; // the stack of open elements
+    String baseUri; // current base uri, for creating new elements
+    Token currentToken; // currentToken is used only for error tracking.
+    ParseSettings settings;
+    Map<String, Tag> seenTags; // tags we've used in this parse; saves tag GC for custom tags.
+
+    private Token.StartTag start; // start tag to process
+    private final Token.EndTag end  = new Token.EndTag();
     abstract ParseSettings defaultSettings();
 
     private boolean trackSourceRange;  // optionally tracks the source range of nodes
 
-    @ParametersAreNonnullByDefault
-    protected void initialiseParse(Reader input, String baseUri, Parser parser) {
+    void initialiseParse(Reader input, String baseUri, Parser parser) {
         Validate.notNullParam(input, "input");
         Validate.notNullParam(baseUri, "baseUri");
         Validate.notNull(parser);
@@ -51,13 +49,13 @@ protected void initialiseParse(Reader input, String baseUri, Parser parser) {
         trackSourceRange = parser.isTrackPosition();
         reader.trackNewlines(parser.isTrackErrors() || trackSourceRange); // when tracking errors or source ranges, enable newline tracking for better legibility
         currentToken = null;
-        tokeniser = new Tokeniser(reader, parser.getErrors());
+        tokeniser = new Tokeniser(reader, parser.getErrors(), trackSourceRange);
         stack = new ArrayList<>(32);
         seenTags = new HashMap<>();
+        start = new Token.StartTag(trackSourceRange, reader);
         this.baseUri = baseUri;
     }
 
-    @ParametersAreNonnullByDefault
     Document parse(Reader input, String baseUri, Parser parser) {
         initialiseParse(input, baseUri, parser);
         runParser();
@@ -80,55 +78,77 @@ Document parse(Reader input, String baseUri, Parser parser) {
 
     abstract List<Node> parseFragment(String inputFragment, Element context, String baseUri, Parser parser);
 
-    protected void runParser() {
+    void runParser() {
         final Tokeniser tokeniser = this.tokeniser;
         final Token.TokenType eof = Token.TokenType.EOF;
 
         while (true) {
             Token token = tokeniser.read();
+            currentToken = token;
             process(token);
-            token.reset();
-
             if (token.type == eof)
                 break;
+            token.reset();
         }
+
+        // once we hit the end, pop remaining items off the stack
+        while (!stack.isEmpty()) pop();
     }
 
-    protected abstract boolean process(Token token);
+    abstract boolean process(Token token);
 
-    protected boolean processStartTag(String name) {
+    boolean processStartTag(String name) {
         // these are "virtual" start tags (auto-created by the treebuilder), so not tracking the start position
         final Token.StartTag start = this.start;
         if (currentToken == start) { // don't recycle an in-use token
-            return process(new Token.StartTag().name(name));
+            return process(new Token.StartTag(trackSourceRange, reader).name(name));
         }
         return process(start.reset().name(name));
     }
 
-    public boolean processStartTag(String name, Attributes attrs) {
+    boolean processStartTag(String name, Attributes attrs) {
         final Token.StartTag start = this.start;
         if (currentToken == start) { // don't recycle an in-use token
-            return process(new Token.StartTag().nameAttr(name, attrs));
+            return process(new Token.StartTag(trackSourceRange, reader).nameAttr(name, attrs));
         }
         start.reset();
         start.nameAttr(name, attrs);
         return process(start);
     }
 
-    protected boolean processEndTag(String name) {
+    boolean processEndTag(String name) {
         if (currentToken == end) { // don't recycle an in-use token
             return process(new Token.EndTag().name(name));
         }
         return process(end.reset().name(name));
     }
 
+    /**
+     Removes the last Element from the stack, hits onNodeClosed, and then returns it.
+     * @return the element that was removed from the stack
+     */
+    final Element pop() {
+        int size = stack.size();
+        Element removed = stack.remove(size - 1);
+        onNodeClosed(removed);
+        return removed;
+    }
+
+    /**
+     Adds the specified Element to the end of the stack, and hits onNodeInserted.
+     * @param element the element to add to the end of the stack
+     */
+    final void push(Element element) {
+        stack.add(element);
+        onNodeInserted(element);
+    }
 
     /**
      Get the current element (last on the stack). If all items have been removed, returns the document instead
      (which might not actually be on the stack; use stack.size() == 0 to test if required.
      @return the last element on the stack, if any; or the root document
      */
-    protected Element currentElement() {
+    Element currentElement() {
         int size = stack.size();
         return size > 0 ? stack.get(size-1) : doc;
     }
@@ -138,7 +158,7 @@ protected Element currentElement() {
      @param normalName name to check
      @return true if there is a current element on the stack, and its name equals the supplied
      */
-    protected boolean currentElementIs(String normalName) {
+    boolean currentElementIs(String normalName) {
         if (stack.size() == 0)
             return false;
         Element current = currentElement();
@@ -152,7 +172,7 @@ protected boolean currentElementIs(String normalName) {
      @param namespace the namespace
      @return true if there is a current element on the stack, and its name equals the supplied
      */
-    protected boolean currentElementIs(String normalName, String namespace) {
+    boolean currentElementIs(String normalName, String namespace) {
         if (stack.size() == 0)
             return false;
         Element current = currentElement();
@@ -164,7 +184,7 @@ protected boolean currentElementIs(String normalName, String namespace) {
      * If the parser is tracking errors, add an error at the current position.
      * @param msg error message
      */
-    protected void error(String msg) {
+    void error(String msg) {
         error(msg, (Object[]) null);
     }
 
@@ -173,7 +193,7 @@ protected void error(String msg) {
      * @param msg error message template
      * @param args template arguments
      */
-    protected void error(String msg, Object... args) {
+    void error(String msg, Object... args) {
         ParseErrorList errors = parser.getErrors();
         if (errors.canAddError())
             errors.add(new ParseError(reader, msg, args));
@@ -183,11 +203,11 @@ protected void error(String msg, Object... args) {
      (An internal method, visible for Element. For HTML parse, signals that script and style text should be treated as
      Data Nodes).
      */
-    protected boolean isContentForTagData(String normalName) {
+    boolean isContentForTagData(String normalName) {
         return false;
     }
 
-    protected Tag tagFor(String tagName, String namespace, ParseSettings settings) {
+    Tag tagFor(String tagName, String namespace, ParseSettings settings) {
         Tag cached = seenTags.get(tagName); // note that we don't normalize the cache key. But tag via valueOf may be normalized.
         if (cached == null || !cached.namespace().equals(namespace)) {
             // only return from cache if the namespace is the same. not running nested cache to save double hit on the common flow
@@ -198,7 +218,7 @@ protected Tag tagFor(String tagName, String namespace, ParseSettings settings) {
         return cached;
     }
 
-    protected Tag tagFor(String tagName, ParseSettings settings) {
+    Tag tagFor(String tagName, ParseSettings settings) {
         return tagFor(tagName, defaultNamespace(), settings);
     }
 
@@ -206,40 +226,58 @@ protected Tag tagFor(String tagName, ParseSettings settings) {
      Gets the default namespace for this TreeBuilder
      * @return the default namespace
      */
-    protected String defaultNamespace() {
+    String defaultNamespace() {
         return NamespaceHtml;
     }
 
     /**
      Called by implementing TreeBuilders when a node has been inserted. This implementation includes optionally tracking
-     the source range of the node.
-     * @param node the node that was just inserted
-     * @param token the (optional) token that created this node
+     the source range of the node. The {@code node} argument is the node that was just inserted.
      */
-    protected void onNodeInserted(Node node, @Nullable Token token) {
-        trackNodePosition(node, token, true);
+    void onNodeInserted(Node node) {
+        trackNodePosition(node, true);
     }
 
     /**
      Called by implementing TreeBuilders when a node is explicitly closed. This implementation includes optionally
-     tracking the closing source range of the node.
-     * @param node the node being closed
-     * @param token the end-tag token that closed this node
+     tracking the closing source range of the node. The {@code node} argument is the node being closed.
      */
-    protected void onNodeClosed(Node node, Token token) {
-        trackNodePosition(node, token, false);
+    void onNodeClosed(Node node) {
+        trackNodePosition(node, false);
     }
 
-    private void trackNodePosition(Node node, @Nullable Token token, boolean start) {
-        if (trackSourceRange && token != null) {
-            int startPos = token.startPos();
-            if (startPos == Token.Unset) return; // untracked, virtual token
-
-            Range.Position startRange = new Range.Position(startPos, reader.lineNumber(startPos), reader.columnNumber(startPos));
-            int endPos = token.endPos();
-            Range.Position endRange = new Range.Position(endPos, reader.lineNumber(endPos), reader.columnNumber(endPos));
-            Range range = new Range(startRange, endRange);
-            range.track(node, start);
+    private void trackNodePosition(Node node, boolean isStart) {
+        if (!trackSourceRange) return;
+
+        final Token token = currentToken;
+        int startPos = token.startPos();
+        int endPos = token.endPos();
+
+        // handle implicit element open / closes.
+        if (node instanceof Element) {
+            final Element el = (Element) node;
+            if (token.isEOF()) {
+                if (el.endSourceRange().isTracked())
+                    return; // /body and /html are left on stack until EOF, don't reset them
+                startPos = endPos = reader.pos();
+            } else if (isStart) { // opening tag
+                if  (!token.isStartTag() || !el.normalName().equals(token.asStartTag().normalName)) {
+                    endPos = startPos;
+                }
+            } else { // closing tag
+                if (!el.tag().isEmpty() && !el.tag().isSelfClosing()) {
+                    if (!token.isEndTag() || !el.normalName().equals(token.asEndTag().normalName)) {
+                        endPos = startPos;
+                    }
+                }
+            }
         }
+
+        Range.Position startPosition = new Range.Position
+            (startPos, reader.lineNumber(startPos), reader.columnNumber(startPos));
+        Range.Position endPosition = new Range.Position
+            (endPos, reader.lineNumber(endPos), reader.columnNumber(endPos));
+        Range range = new Range(startPosition, endPosition);
+        node.attributes().userData(isStart ? SharedConstants.RangeKey : SharedConstants.EndRangeKey, range);
     }
 }
diff --git a/src/main/java/org/jsoup/parser/XmlTreeBuilder.java b/src/main/java/org/jsoup/parser/XmlTreeBuilder.java
index e1999f9679..8ef653eee3 100644
--- a/src/main/java/org/jsoup/parser/XmlTreeBuilder.java
+++ b/src/main/java/org/jsoup/parser/XmlTreeBuilder.java
@@ -7,11 +7,11 @@
 import org.jsoup.nodes.DocumentType;
 import org.jsoup.nodes.Element;
 import org.jsoup.nodes.Entities;
+import org.jsoup.nodes.LeafNode;
 import org.jsoup.nodes.Node;
 import org.jsoup.nodes.TextNode;
 import org.jsoup.nodes.XmlDeclaration;
 
-import javax.annotation.ParametersAreNonnullByDefault;
 import java.io.Reader;
 import java.io.StringReader;
 import java.util.List;
@@ -26,14 +26,14 @@
  * @author Jonathan Hedley
  */
 public class XmlTreeBuilder extends TreeBuilder {
-    ParseSettings defaultSettings() {
+    @Override ParseSettings defaultSettings() {
         return ParseSettings.preserveCase;
     }
 
-    @Override @ParametersAreNonnullByDefault
+    @Override
     protected void initialiseParse(Reader input, String baseUri, Parser parser) {
         super.initialiseParse(input, baseUri, parser);
-        stack.add(doc); // place the document onto the stack. differs from HtmlTreeBuilder (not on stack)
+        stack.add(doc); // place the document onto the stack. differs from HtmlTreeBuilder (not on stack). Note not push()ed, so not onNodeInserted.
         doc.outputSettings()
             .syntax(Document.OutputSettings.Syntax.xml)
             .escapeMode(Entities.EscapeMode.xhtml)
@@ -59,22 +59,24 @@ XmlTreeBuilder newInstance() {
 
     @Override
     protected boolean process(Token token) {
+        currentToken = token;
+
         // start tag, end tag, doctype, comment, character, eof
         switch (token.type) {
             case StartTag:
-                insert(token.asStartTag());
+                insertElementFor(token.asStartTag());
                 break;
             case EndTag:
                 popStackToClose(token.asEndTag());
                 break;
             case Comment:
-                insert(token.asComment());
+                insertCommentFor(token.asComment());
                 break;
             case Character:
-                insert(token.asCharacter());
+                insertCharacterFor(token.asCharacter());
                 break;
             case Doctype:
-                insert(token.asDoctype());
+                insertDoctypeFor(token.asDoctype());
                 break;
             case EOF: // could put some normalisation here if desired
                 break;
@@ -84,53 +86,63 @@ protected boolean process(Token token) {
         return true;
     }
 
-    protected void insertNode(Node node) {
-        currentElement().appendChild(node);
-        onNodeInserted(node, null);
-    }
-
-    protected void insertNode(Node node, Token token) {
-        currentElement().appendChild(node);
-        onNodeInserted(node, token);
-    }
-
-    Element insert(Token.StartTag startTag) {
+    void insertElementFor(Token.StartTag startTag) {
         Tag tag = tagFor(startTag.name(), settings);
-        if (startTag.hasAttributes())
+        if (startTag.attributes != null)
             startTag.attributes.deduplicate(settings);
 
         Element el = new Element(tag, null, settings.normalizeAttributes(startTag.attributes));
-        insertNode(el, startTag);
+        currentElement().appendChild(el);
+        push(el);
+
         if (startTag.isSelfClosing()) {
             tag.setSelfClosing();
-        } else {
-            stack.add(el);
+            pop(); // push & pop ensures onNodeInserted & onNodeClosed
         }
-        return el;
     }
 
-    void insert(Token.Comment commentToken) {
+    void insertLeafNode(LeafNode node) {
+        currentElement().appendChild(node);
+        onNodeInserted(node);
+    }
+
+    void insertCommentFor(Token.Comment commentToken) {
         Comment comment = new Comment(commentToken.getData());
-        Node insert = comment;
+        LeafNode insert = comment;
         if (commentToken.bogus && comment.isXmlDeclaration()) {
             // xml declarations are emitted as bogus comments (which is right for html, but not xml)
             // so we do a bit of a hack and parse the data as an element to pull the attributes out
+            // todo - refactor this to parse more appropriately
             XmlDeclaration decl = comment.asXmlDeclaration(); // else, we couldn't parse it as a decl, so leave as a comment
             if (decl != null)
                 insert = decl;
         }
-        insertNode(insert, commentToken);
+        insertLeafNode(insert);
     }
 
-    void insert(Token.Character token) {
+    void insertCharacterFor(Token.Character token) {
         final String data = token.getData();
-        insertNode(token.isCData() ? new CDataNode(data) : new TextNode(data), token);
+        insertLeafNode(token.isCData() ? new CDataNode(data) : new TextNode(data));
+    }
+
+    void insertDoctypeFor(Token.Doctype token) {
+        DocumentType doctypeNode = new DocumentType(settings.normalizeTag(token.getName()), token.getPublicIdentifier(), token.getSystemIdentifier());
+        doctypeNode.setPubSysKey(token.getPubSysKey());
+        insertLeafNode(doctypeNode);
+    }
+
+    /** @deprecated unused and will be removed. */
+    @Deprecated
+    protected void insertNode(Node node) {
+        currentElement().appendChild(node);
+        onNodeInserted(node);
     }
 
-    void insert(Token.Doctype d) {
-        DocumentType doctypeNode = new DocumentType(settings.normalizeTag(d.getName()), d.getPublicIdentifier(), d.getSystemIdentifier());
-        doctypeNode.setPubSysKey(d.getPubSysKey());
-        insertNode(doctypeNode, d);
+    /** @deprecated unused and will be removed. */
+    @Deprecated
+    protected void insertNode(Node node, Token token) {
+        currentElement().appendChild(node);
+        onNodeInserted(node);
     }
 
     /**
@@ -158,25 +170,21 @@ protected void popStackToClose(Token.EndTag endTag) {
             return; // not found, skip
 
         for (int pos = stack.size() -1; pos >= 0; pos--) {
-            Element next = stack.get(pos);
-            stack.remove(pos);
+            Element next = pop();
             if (next == firstFound) {
-                onNodeClosed(next, endTag);
                 break;
             }
         }
     }
     private static final int maxQueueDepth = 256; // an arbitrary tension point between real XML and crafted pain
 
-
-
     List<Node> parseFragment(String inputFragment, String baseUri, Parser parser) {
         initialiseParse(new StringReader(inputFragment), baseUri, parser);
         runParser();
         return doc.childNodes();
     }
 
-    List<Node> parseFragment(String inputFragment, Element context, String baseUri, Parser parser) {
+    @Override List<Node> parseFragment(String inputFragment, Element context, String baseUri, Parser parser) {
         return parseFragment(inputFragment, baseUri, parser);
     }
 }
diff --git a/src/main/java/org/jsoup/parser/package-info.java b/src/main/java/org/jsoup/parser/package-info.java
index f1b3c88741..35d25a5248 100644
--- a/src/main/java/org/jsoup/parser/package-info.java
+++ b/src/main/java/org/jsoup/parser/package-info.java
@@ -1,7 +1,7 @@
 /**
  Contains the HTML parser, tag specifications, and HTML tokeniser.
  */
-@NonnullByDefault
+@NullMarked
 package org.jsoup.parser;
 
-import org.jsoup.internal.NonnullByDefault;
+import org.jspecify.annotations.NullMarked;
diff --git a/src/main/java/org/jsoup/safety/Cleaner.java b/src/main/java/org/jsoup/safety/Cleaner.java
index 7b9317ec29..b84608abac 100644
--- a/src/main/java/org/jsoup/safety/Cleaner.java
+++ b/src/main/java/org/jsoup/safety/Cleaner.java
@@ -9,15 +9,12 @@
 import org.jsoup.nodes.Node;
 import org.jsoup.nodes.TextNode;
 import org.jsoup.parser.ParseErrorList;
-import org.jsoup.parser.ParseSettings;
 import org.jsoup.parser.Parser;
-import org.jsoup.parser.Tag;
 import org.jsoup.select.NodeTraversor;
 import org.jsoup.select.NodeVisitor;
 
 import java.util.List;
 
-
 /**
  The safelist based HTML cleaner. Use to ensure that end-user provided HTML contains only the elements and attributes
  that you are expecting; no junk, and no cross-site scripting attacks!
@@ -137,7 +134,7 @@ private CleaningVisitor(Element root, Element destination) {
             this.destination = destination;
         }
 
-        public void head(Node source, int depth) {
+        @Override public void head(Node source, int depth) {
             if (source instanceof Element) {
                 Element sourceEl = (Element) source;
 
@@ -155,7 +152,7 @@ public void head(Node source, int depth) {
                 TextNode sourceText = (TextNode) source;
                 TextNode destText = new TextNode(sourceText.getWholeText());
                 destination.appendChild(destText);
-            } else if (source instanceof DataNode && safelist.isSafeTag(source.parent().nodeName())) {
+            } else if (source instanceof DataNode && safelist.isSafeTag(source.parent().normalName())) {
               DataNode sourceData = (DataNode) source;
               DataNode destData = new DataNode(sourceData.getWholeData());
               destination.appendChild(destData);
@@ -164,8 +161,8 @@ public void head(Node source, int depth) {
             }
         }
 
-        public void tail(Node source, int depth) {
-            if (source instanceof Element && safelist.isSafeTag(source.nodeName())) {
+        @Override public void tail(Node source, int depth) {
+            if (source instanceof Element && safelist.isSafeTag(source.normalName())) {
                 destination = destination.parent(); // would have descended, so pop destination stack
             }
         }
@@ -178,11 +175,12 @@ private int copySafeNodes(Element source, Element dest) {
     }
 
     private ElementMeta createSafeElement(Element sourceEl) {
+        Element dest = sourceEl.shallowClone(); // reuses tag, clones attributes and preserves any user data
         String sourceTag = sourceEl.tagName();
-        Attributes destAttrs = new Attributes();
-        Element dest = new Element(Tag.valueOf(sourceTag, sourceEl.tag().namespace(), ParseSettings.preserveCase), sourceEl.baseUri(), destAttrs);
-        int numDiscarded = 0;
+        Attributes destAttrs = dest.attributes();
+        dest.clearAttributes(); // clear all non-internal attributes, ready for safe copy
 
+        int numDiscarded = 0;
         Attributes sourceAttrs = sourceEl.attributes();
         for (Attribute sourceAttr : sourceAttrs) {
             if (safelist.isSafeAttribute(sourceTag, sourceEl, sourceAttr))
@@ -192,14 +190,7 @@ private ElementMeta createSafeElement(Element sourceEl) {
         }
         Attributes enforcedAttrs = safelist.getEnforcedAttributes(sourceTag);
         destAttrs.addAll(enforcedAttrs);
-
-        // Copy the original start and end range, if set
-        // TODO - might be good to make a generic Element#userData set type interface, and copy those all over
-        if (sourceEl.sourceRange().isTracked())
-            sourceEl.sourceRange().track(dest, true);
-        if (sourceEl.endSourceRange().isTracked())
-            sourceEl.endSourceRange().track(dest, false);
-
+        dest.attributes().addAll(destAttrs); // re-attach, if removed in clear
         return new ElementMeta(dest, numDiscarded);
     }
 
diff --git a/src/main/java/org/jsoup/safety/Safelist.java b/src/main/java/org/jsoup/safety/Safelist.java
index d1f275df39..eb1281ba6d 100644
--- a/src/main/java/org/jsoup/safety/Safelist.java
+++ b/src/main/java/org/jsoup/safety/Safelist.java
@@ -6,6 +6,7 @@ Thank you to Ryan Grove (wonko.com) for the Ruby HTML cleaner http://github.com/
  */
 
 import org.jsoup.helper.Validate;
+import org.jsoup.internal.Normalizer;
 import org.jsoup.nodes.Attribute;
 import org.jsoup.nodes.Attributes;
 import org.jsoup.nodes.Element;
@@ -52,9 +53,8 @@ If you need to allow more through (please be careful!), tweak a base safelist wi
 
  <p>
  The cleaner and these safelists assume that you want to clean a <code>body</code> fragment of HTML (to add user
- supplied HTML into a templated page), and not to clean a full HTML document. If the latter is the case, either wrap the
- document HTML around the cleaned body HTML, or create a safelist that allows <code>html</code> and <code>head</code>
- elements as appropriate.
+ supplied HTML into a templated page), and not to clean a full HTML document. If the latter is the case, you could wrap
+ the templated document HTML around the cleaned body HTML.
  </p>
  <p>
  If you are going to extend a safelist, please be very careful. Make sure you understand what attributes may lead to
@@ -297,8 +297,8 @@ public Safelist addAttributes(String tag, String... attributes) {
         Validate.notNull(attributes);
         Validate.isTrue(attributes.length > 0, "No attribute names supplied.");
 
+        addTags(tag);
         TagName tagName = TagName.valueOf(tag);
-        tagNames.add(tagName);
         Set<AttributeKey> attributeSet = new HashSet<>();
         for (String key : attributes) {
             Validate.notEmpty(key);
@@ -622,7 +622,7 @@ static class TagName extends TypedValue {
         }
 
         static TagName valueOf(String value) {
-            return new TagName(value);
+            return new TagName(Normalizer.lowerCase(value));
         }
     }
 
@@ -632,7 +632,7 @@ static class AttributeKey extends TypedValue {
         }
 
         static AttributeKey valueOf(String value) {
-            return new AttributeKey(value);
+            return new AttributeKey(Normalizer.lowerCase(value));
         }
     }
 
diff --git a/src/main/java/org/jsoup/safety/package-info.java b/src/main/java/org/jsoup/safety/package-info.java
index 26b4b701bb..11396ebe4d 100644
--- a/src/main/java/org/jsoup/safety/package-info.java
+++ b/src/main/java/org/jsoup/safety/package-info.java
@@ -1,4 +1,7 @@
 /**
  Contains the jsoup HTML cleaner, and safelist definitions.
  */
+@NullMarked
 package org.jsoup.safety;
+
+import org.jspecify.annotations.NullMarked;
\ No newline at end of file
diff --git a/src/main/java/org/jsoup/select/Collector.java b/src/main/java/org/jsoup/select/Collector.java
index 00f384b6b5..02b0528384 100644
--- a/src/main/java/org/jsoup/select/Collector.java
+++ b/src/main/java/org/jsoup/select/Collector.java
@@ -1,12 +1,10 @@
 package org.jsoup.select;
 
 import org.jsoup.nodes.Element;
-import org.jsoup.nodes.Node;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
-
-import static org.jsoup.select.NodeFilter.FilterResult.CONTINUE;
-import static org.jsoup.select.NodeFilter.FilterResult.STOP;
+import java.util.Optional;
+import java.util.stream.Collectors;
 
 /**
  * Collects a list of elements that match the supplied criteria.
@@ -25,15 +23,10 @@ private Collector() {}
      */
     public static Elements collect (Evaluator eval, Element root) {
         eval.reset();
-        Elements elements = new Elements();
-        NodeTraversor.traverse((node, depth) -> {
-            if (node instanceof Element) {
-                Element el = (Element) node;
-                if (eval.matches(root, el))
-                    elements.add(el);
-            }
-        }, root);
-        return elements;
+
+        return root.stream()
+            .filter(eval.asPredicate(root))
+            .collect(Collectors.toCollection(Elements::new));
     }
 
     /**
@@ -45,36 +38,8 @@ public static Elements collect (Evaluator eval, Element root) {
      */
     public static @Nullable Element findFirst(Evaluator eval, Element root) {
         eval.reset();
-        FirstFinder finder = new FirstFinder(eval);
-        return finder.find(root, root);
-    }
-
-    static class FirstFinder implements NodeFilter {
-        private @Nullable Element evalRoot = null;
-        private @Nullable Element match = null;
-        private final Evaluator eval;
-
-        FirstFinder(Evaluator eval) {
-            this.eval = eval;
-        }
-
-        @Nullable Element find(Element root, Element start) {
-            evalRoot = root;
-            match = null;
-            NodeTraversor.filter(this, start);
-            return match;
-        }
 
-        @Override
-        public FilterResult head(Node node, int depth) {
-            if (node instanceof Element) {
-                Element el = (Element) node;
-                if (eval.matches(evalRoot, el)) {
-                    match = el;
-                    return STOP;
-                }
-            }
-            return CONTINUE;
-        }
+        Optional<Element> first = root.stream().filter(eval.asPredicate(root)).findFirst();
+        return first.orElse(null);
     }
 }
diff --git a/src/main/java/org/jsoup/select/CombiningEvaluator.java b/src/main/java/org/jsoup/select/CombiningEvaluator.java
index 3af498e68a..25e5eac2ee 100644
--- a/src/main/java/org/jsoup/select/CombiningEvaluator.java
+++ b/src/main/java/org/jsoup/select/CombiningEvaluator.java
@@ -2,8 +2,8 @@
 
 import org.jsoup.internal.StringUtil;
 import org.jsoup.nodes.Element;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
 import java.util.ArrayList;
 import java.util.Arrays;
 import java.util.Collection;
diff --git a/src/main/java/org/jsoup/select/Elements.java b/src/main/java/org/jsoup/select/Elements.java
index 31838e1f89..c344f2e06d 100644
--- a/src/main/java/org/jsoup/select/Elements.java
+++ b/src/main/java/org/jsoup/select/Elements.java
@@ -8,20 +8,23 @@
 import org.jsoup.nodes.FormElement;
 import org.jsoup.nodes.Node;
 import org.jsoup.nodes.TextNode;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
 import java.util.ArrayList;
 import java.util.Arrays;
 import java.util.Collection;
 import java.util.HashSet;
+import java.util.Iterator;
 import java.util.LinkedHashSet;
 import java.util.List;
+import java.util.function.Predicate;
+import java.util.function.UnaryOperator;
 
 /**
  A list of {@link Element}s, with methods that act on every element in the list.
- <p>
- To get an {@code Elements} object, use the {@link Element#select(String)} method.
- </p>
+ <p>To get an {@code Elements} object, use the {@link Element#select(String)} method.</p>
+ <p>Methods that {@link #set(int, Element) set}, {@link #remove(int) remove}, or {@link #replaceAll(UnaryOperator)
+ replace} Elements in the list will also act on the underlying {@link org.jsoup.nodes.Document DOM}.</p>
 
  @author Jonathan Hedley, jonathan@hedley.net */
 public class Elements extends ArrayList<Element> {
@@ -62,7 +65,7 @@ public Elements clone() {
     /**
      Get an attribute value from the first matched element that has the attribute.
      @param attributeKey The attribute key.
-     @return The attribute value from the first matched element that has the attribute.. If no elements were matched (isEmpty() == true),
+     @return The attribute value from the first matched element that has the attribute. If no elements were matched (isEmpty() == true),
      or if the no elements have the attribute, returns empty string.
      @see #hasAttr(String)
      */
@@ -431,6 +434,7 @@ public Elements empty() {
 
     /**
      * Remove each matched element from the DOM. This is similar to setting the outer HTML of each element to nothing.
+     * <p>The elements will still be retained in this list, in case further processing of them is desired.</p>
      * <p>
      * E.g. HTML: {@code <div><p>Hello</p> <p>there</p> <img /></div>}<br>
      * <code>doc.select("p").remove();</code><br>
@@ -440,6 +444,7 @@ public Elements empty() {
      * @return this, for chaining
      * @see Element#empty()
      * @see #empty()
+     * @see #clear()
      */
     public Elements remove() {
         for (Element element : this) {
@@ -683,4 +688,121 @@ private <T extends Node> List<T> childNodesOfType(Class<T> tClass) {
         return nodes;
     }
 
+    // list methods that update the DOM:
+
+    /**
+     Replace the Element at the specified index in this list, and in the DOM.
+     * @param index index of the element to replace
+     * @param element element to be stored at the specified position
+     * @return the old Element at this index
+     * @since 1.17.1
+     */
+    @Override public Element set(int index, Element element) {
+        Validate.notNull(element);
+        Element old = super.set(index, element);
+        old.replaceWith(element);
+        return old;
+    }
+
+    /**
+     Remove the Element at the specified index in this list, and from the DOM.
+     * @param index the index of the element to be removed
+     * @return the old element at this index
+     * @since 1.17.1
+     */
+    @Override public Element remove(int index) {
+        Element old = super.remove(index);
+        old.remove();
+        return old;
+    }
+
+    /**
+     Remove the specified Element from this list, and from the DOM.
+     * @param o element to be removed from this list, if present
+     * @return if this list contained the Element
+     * @since 1.17.1
+     */
+    @Override public boolean remove(Object o) {
+        int index = super.indexOf(o);
+        if (index == -1) {
+            return false;
+        } else {
+            remove(index);
+            return true;
+        }
+    }
+
+    /**
+     Removes all the elements from this list, and each of them from the DOM.
+     * @since 1.17.1
+     * @see #remove()
+     */
+    @Override public void clear() {
+        remove();
+        super.clear();
+    }
+
+    /**
+     Removes from this list, and from the DOM, each of the elements that are contained in the specified collection and
+     are in this list.
+     * @param c collection containing elements to be removed from this list
+     * @return {@code true} if elements were removed from this list
+     * @since 1.17.1
+     */
+    @Override public boolean removeAll(Collection<?> c) {
+        boolean anyRemoved = false;
+        for (Object o : c) {
+            anyRemoved |= this.remove(o);
+        }
+        return anyRemoved;
+    }
+
+    /**
+     Retain in this list, and in the DOM, only the elements that are in the specified collection and are in this list.
+     In other words, remove from this list and the DOM any item that is in this list but not in the specified
+     collection.
+     * @param c collection containing elements to be retained in this list
+     * @return {@code true} if elements were removed from this list
+     * @since 1.17.1
+     */
+    @Override public boolean retainAll(Collection<?> c) {
+        boolean anyRemoved = false;
+        for (Iterator<Element> it = this.iterator(); it.hasNext(); ) {
+            Element el = it.next();
+            if (!c.contains(el)) {
+                it.remove();
+                anyRemoved = true;
+            }
+        }
+        return anyRemoved;
+    }
+
+    /**
+     Remove from the list, and from the DOM, all elements in this list that match the given filter.
+     * @param filter a predicate which returns {@code true} for elements to be removed
+     * @return {@code true} if elements were removed from this list
+     * @since 1.17.1
+     */
+    @Override public boolean removeIf(Predicate<? super Element> filter) {
+        boolean anyRemoved = false;
+        for (Iterator<Element> it = this.iterator(); it.hasNext(); ) {
+            Element el = it.next();
+            if (filter.test(el)) {
+                it.remove();
+                anyRemoved = true;
+            }
+        }
+        return anyRemoved;
+    }
+
+    /**
+     Replace each element in this list with the result of the operator, and update the DOM.
+     * @param operator the operator to apply to each element
+     * @since 1.17.1
+     */
+    @Override public void replaceAll(UnaryOperator<Element> operator) {
+        for (int i = 0; i < this.size(); i++) {
+            this.set(i, operator.apply(this.get(i)));
+        }
+    }
 }
diff --git a/src/main/java/org/jsoup/select/Evaluator.java b/src/main/java/org/jsoup/select/Evaluator.java
index 65040bcf64..24489691ae 100644
--- a/src/main/java/org/jsoup/select/Evaluator.java
+++ b/src/main/java/org/jsoup/select/Evaluator.java
@@ -12,6 +12,7 @@
 import org.jsoup.parser.ParseSettings;
 
 import java.util.List;
+import java.util.function.Predicate;
 import java.util.regex.Matcher;
 import java.util.regex.Pattern;
 
@@ -27,6 +28,16 @@ public abstract class Evaluator {
     protected Evaluator() {
     }
 
+    /**
+     Provides a Predicate for this Evaluator, matching the test Element.
+     * @param root the root Element, for match evaluation
+     * @return a predicate that accepts an Element to test for matches with this Evaluator
+     * @since 1.17.1
+     */
+    public Predicate<Element> asPredicate(Element root) {
+        return element -> matches(root, element);
+    }
+
     /**
      * Test if the element meets the evaluator's requirements.
      *
@@ -327,8 +338,8 @@ public String toString() {
      * Evaluator for attribute name/value matching (value regex matching)
      */
     public static final class AttributeWithValueMatching extends Evaluator {
-        String key;
-        Pattern pattern;
+        final String key;
+        final Pattern pattern;
 
         public AttributeWithValueMatching(String key, Pattern pattern) {
             this.key = normalize(key);
@@ -355,8 +366,8 @@ public String toString() {
      * Abstract evaluator for attribute name/value matching
      */
     public abstract static class AttributeKeyPair extends Evaluator {
-        String key;
-        String value;
+        final String key;
+        final String value;
 
         public AttributeKeyPair(String key, String value) {
             this(key, value, true);
@@ -541,12 +552,12 @@ public IsNthChild(int a, int b) {
     		super(a,b);
 		}
 
-		protected int calculatePosition(Element root, Element element) {
+		@Override protected int calculatePosition(Element root, Element element) {
 			return element.elementSiblingIndex()+1;
 		}
 
 
-		protected String getPseudoClass() {
+		@Override protected String getPseudoClass() {
 			return "nth-child";
 		}
     }
@@ -583,7 +594,7 @@ public IsNthOfType(int a, int b) {
             super(a, b);
         }
 
-        protected int calculatePosition(Element root, Element element) {
+        @Override protected int calculatePosition(Element root, Element element) {
             Element parent = element.parent();
             if (parent == null)
                 return 0;
@@ -729,7 +740,7 @@ public String toString() {
      * @author ant
      */
     public abstract static class IndexEvaluator extends Evaluator {
-        int index;
+        final int index;
 
         public IndexEvaluator(int index) {
             this.index = index;
diff --git a/src/main/java/org/jsoup/select/NodeTraversor.java b/src/main/java/org/jsoup/select/NodeTraversor.java
index 5b01a2f490..de8be092e9 100644
--- a/src/main/java/org/jsoup/select/NodeTraversor.java
+++ b/src/main/java/org/jsoup/select/NodeTraversor.java
@@ -6,16 +6,19 @@
 import org.jsoup.select.NodeFilter.FilterResult;
 
 /**
- * Depth-first node traversor. Use to iterate through all nodes under and including the specified root node.
- * <p>
- * This implementation does not use recursion, so a deep DOM does not risk blowing the stack.
- * </p>
+ A depth-first node traversor. Use to walk through all nodes under and including the specified root node, in document
+ order. The {@link NodeVisitor#head(Node, int)} and {@link NodeVisitor#tail(Node, int)} methods will be called for
+ each node.
+ <p> During traversal, structural changes to nodes are supported (e.g. {@link Node#replaceWith(Node)},
+ {@link Node#remove()}).
+ </p>
  */
 public class NodeTraversor {
     /**
-     * Start a depth-first traverse of the root and all of its descendants.
-     * @param visitor Node visitor.
-     * @param root the root node point to traverse.
+     Run a depth-first traverse of the root and all of its descendants.
+     @param visitor Node visitor.
+     @param root the initial node point to traverse.
+     @see NodeVisitor
      */
     public static void traverse(NodeVisitor visitor, Node root) {
         Validate.notNull(visitor);
@@ -62,9 +65,9 @@ public static void traverse(NodeVisitor visitor, Node root) {
     }
 
     /**
-     * Start a depth-first traverse of all elements.
-     * @param visitor Node visitor.
-     * @param elements Elements to filter.
+     Run a depth-first traversal of each Element.
+     @param visitor Node visitor.
+     @param elements Elements to traverse.
      */
     public static void traverse(NodeVisitor visitor, Elements elements) {
         Validate.notNull(visitor);
@@ -74,10 +77,12 @@ public static void traverse(NodeVisitor visitor, Elements elements) {
     }
 
     /**
-     * Start a depth-first filtering of the root and all of its descendants.
-     * @param filter Node visitor.
-     * @param root the root node point to traverse.
-     * @return The filter result of the root node, or {@link FilterResult#STOP}.
+     Run a depth-first filtered traversal of the root and all of its descendants.
+     @param filter NodeFilter visitor.
+     @param root the root node point to traverse.
+     @return The filter result of the root node, or {@link FilterResult#STOP}.
+
+     @see NodeFilter
      */
     public static FilterResult filter(NodeFilter filter, Node root) {
         Node node = root;
@@ -128,9 +133,9 @@ public static FilterResult filter(NodeFilter filter, Node root) {
     }
 
     /**
-     * Start a depth-first filtering of all elements.
-     * @param filter Node filter.
-     * @param elements Elements to filter.
+     Run a depth-first filtered traversal of each Element.
+     @param filter NodeFilter visitor.
+     @see NodeFilter
      */
     public static void filter(NodeFilter filter, Elements elements) {
         Validate.notNull(filter);
diff --git a/src/main/java/org/jsoup/select/NodeVisitor.java b/src/main/java/org/jsoup/select/NodeVisitor.java
index 0dbdc86ce8..6fa0fa7e13 100644
--- a/src/main/java/org/jsoup/select/NodeVisitor.java
+++ b/src/main/java/org/jsoup/select/NodeVisitor.java
@@ -4,13 +4,26 @@
 import org.jsoup.nodes.Node;
 
 /**
- * Node visitor interface. Provide an implementing class to {@link NodeTraversor} to iterate through nodes.
- * <p>
- * This interface provides two methods, {@code head} and {@code tail}. The head method is called when the node is first
- * seen, and the tail method when all of the node's children have been visited. As an example, {@code head} can be used to
- * emit a start tag for a node, and {@code tail} to create the end tag.
- * </p>
+ Node visitor interface. Provide an implementing class to {@link NodeTraversor} or to {@link Node#traverse(NodeVisitor)}
+ to iterate through nodes.
+ <p>
+ This interface provides two methods, {@link #head} and {@link #tail}. The head method is called when the node is first
+ seen, and the tail method when all of the node's children have been visited. As an example, {@code head} can be used to
+ emit a start tag for a node, and {@code tail} to create the end tag. The {@code tail} method defaults to a no-op, so
+ the {@code head} method is the {@link FunctionalInterface}.
+ </p>
+ <p><b>Example:</b></p>
+ <pre><code>
+ doc.body().traverse((node, depth) -> {
+     switch (node) {
+         case Element el     -> print(el.tag() + ": " + el.ownText());
+         case DataNode data  -> print("Data: " + data.getWholeData());
+         default             -> print(node.nodeName() + " at depth " + depth);
+     }
+ });
+ </code></pre>
  */
+@FunctionalInterface
 public interface NodeVisitor {
     /**
      Callback for when a node is first visited.
diff --git a/src/main/java/org/jsoup/select/QueryParser.java b/src/main/java/org/jsoup/select/QueryParser.java
index 09f53bdd00..b495336602 100644
--- a/src/main/java/org/jsoup/select/QueryParser.java
+++ b/src/main/java/org/jsoup/select/QueryParser.java
@@ -145,18 +145,21 @@ private void combinator(char combinator) {
 
     private String consumeSubQuery() {
         StringBuilder sq = StringUtil.borrowBuilder();
+        boolean seenNonCombinator = false; // eat until we hit a combinator after eating something else
         while (!tq.isEmpty()) {
             if (tq.matches("("))
                 sq.append("(").append(tq.chompBalanced('(', ')')).append(")");
             else if (tq.matches("["))
                 sq.append("[").append(tq.chompBalanced('[', ']')).append("]");
             else if (tq.matchesAny(Combinators))
-                if (sq.length() > 0)
+                if (seenNonCombinator)
                     break;
                 else
-                    tq.consume();
-            else
+                    sq.append(tq.consume());
+            else {
+                seenNonCombinator = true;
                 sq.append(tq.consume());
+            }
         }
         return StringUtil.releaseBuilder(sq);
     }
@@ -189,6 +192,8 @@ private Evaluator parsePseudoSelector() {
                 return new Evaluator.IndexEquals(consumeIndex());
             case "has":
                 return has();
+            case "is":
+                return is();
             case "contains":
                 return contains(false);
             case "containsOwn":
@@ -365,6 +370,13 @@ private Evaluator has() {
         return new StructuralEvaluator.Has(parse(subQuery));
     }
 
+    // pseudo selector :is()
+    private Evaluator is() {
+        String subQuery = consumeParens();
+        Validate.notEmpty(subQuery, ":is(selector) sub-select must not be empty");
+        return new StructuralEvaluator.Is(parse(subQuery));
+    }
+
     // pseudo selector :contains(text), containsOwn(text)
     private Evaluator contains(boolean own) {
         String query = own ? ":containsOwn" : ":contains";
diff --git a/src/main/java/org/jsoup/select/Selector.java b/src/main/java/org/jsoup/select/Selector.java
index 95c1756097..c050ff1366 100644
--- a/src/main/java/org/jsoup/select/Selector.java
+++ b/src/main/java/org/jsoup/select/Selector.java
@@ -2,8 +2,8 @@
 
 import org.jsoup.helper.Validate;
 import org.jsoup.nodes.Element;
+import org.jspecify.annotations.Nullable;
 
-import javax.annotation.Nullable;
 import java.util.Collection;
 import java.util.IdentityHashMap;
 
@@ -47,7 +47,8 @@
  * <tr><td><code>:lt(<em>n</em>)</code></td><td>elements whose sibling index is less than <em>n</em></td><td><code>td:lt(3)</code> finds the first 3 cells of each row</td></tr>
  * <tr><td><code>:gt(<em>n</em>)</code></td><td>elements whose sibling index is greater than <em>n</em></td><td><code>td:gt(1)</code> finds cells after skipping the first two</td></tr>
  * <tr><td><code>:eq(<em>n</em>)</code></td><td>elements whose sibling index is equal to <em>n</em></td><td><code>td:eq(0)</code> finds the first cell of each row</td></tr>
- * <tr><td><code>:has(<em>selector</em>)</code></td><td>elements that contains at least one element matching the <em>selector</em></td><td><code>div:has(p)</code> finds <code>div</code>s that contain <code>p</code> elements.<br><code>div:has(&gt; a)</code> selects <code>div</code> elements that have at least one direct child <code>a</code> element.</td></tr>
+ * <tr><td><code>:has(<em>selector</em>)</code></td><td>elements that contains at least one element matching the <em>selector</em></td><td><code>div:has(p)</code> finds <code>div</code>s that contain <code>p</code> elements.<br><code>div:has(&gt; a)</code> selects <code>div</code> elements that have at least one direct child <code>a</code> element.<br><code>section:has(h1, h2)</code> finds <code>section</code> elements that contain a <code>h1</code> or a <code>h2</code> element</td></tr>
+ * <tr><td><code>:is(<em>selector list</em>)</code></td><td>elements that match any of the selectors in the selector list</td><td><code>:is(h1, h2, h3, h4, h5, h6)</code> finds any heading element.<br><code>:is(section, article) &gt; :is(h1, h2)</code> finds a <code>h1</code> or <code>h2</code> that is a direct child of a <code>section</code> or an <code>article</code></td></tr>
  * <tr><td><code>:not(<em>selector</em>)</code></td><td>elements that do not match the <em>selector</em>. See also {@link Elements#not(String)}</td><td><code>div:not(.logo)</code> finds all divs that do not have the "logo" class.<p><code>div:not(:has(div))</code> finds divs that do not contain divs.</p></td></tr>
  * <tr><td><code>:contains(<em>text</em>)</code></td><td>elements that contains the specified text. The search is case insensitive. The text may appear in the found element, or any of its descendants. The text is whitespace normalized. <p>To find content that includes parentheses, escape those with a {@code \}.</p></td><td><code>p:contains(jsoup)</code> finds p elements containing the text "jsoup".<p>{@code p:contains(hello \(there\) finds p elements containing the text "Hello (There)"}</p></td></tr>
  * <tr><td><code>:containsOwn(<em>text</em>)</code></td><td>elements that directly contain the specified text. The search is case insensitive. The text must appear in the found element, not any of its descendants.</td><td><code>p:containsOwn(jsoup)</code> finds p elements with own text "jsoup".</td></tr>
diff --git a/src/main/java/org/jsoup/select/StructuralEvaluator.java b/src/main/java/org/jsoup/select/StructuralEvaluator.java
index 96ff252e5b..1e84427068 100644
--- a/src/main/java/org/jsoup/select/StructuralEvaluator.java
+++ b/src/main/java/org/jsoup/select/StructuralEvaluator.java
@@ -2,7 +2,7 @@
 
 import org.jsoup.internal.StringUtil;
 import org.jsoup.nodes.Element;
-import org.jsoup.nodes.Node;
+import org.jsoup.nodes.NodeIterator;
 
 import java.util.ArrayList;
 import java.util.IdentityHashMap;
@@ -59,23 +59,21 @@ public boolean matches(Element root, Element element) {
     }
 
     static class Has extends StructuralEvaluator {
-        final Collector.FirstFinder finder;
+        final NodeIterator<Element> it = new NodeIterator<>(new Element("html"), Element.class);
+        // the element here is just a placeholder so this can be final - gets set in restart()
 
         public Has(Evaluator evaluator) {
             super(evaluator);
-            finder = new Collector.FirstFinder(evaluator);
         }
 
-        @Override
-        public boolean matches(Element root, Element element) {
+        @Override public boolean matches(Element root, Element element) {
             // for :has, we only want to match children (or below), not the input element. And we want to minimize GCs
-            for (int i = 0; i < element.childNodeSize(); i++) {
-                Node node = element.childNode(i);
-                if (node instanceof Element) {
-                    Element match = finder.find(element, (Element) node);
-                    if (match != null)
-                        return true;
-                }
+            it.restart(element);
+            while (it.hasNext()) {
+                Element el = it.next();
+                if (el == element) continue; // don't match self, only descendants
+                if (evaluator.matches(element, el))
+                    return true;
             }
             return false;
         }
@@ -90,6 +88,27 @@ public String toString() {
         }
     }
 
+    /** Implements the :is(sub-query) pseudo-selector */
+    static class Is extends StructuralEvaluator {
+        public Is(Evaluator evaluator) {
+            super(evaluator);
+        }
+
+        @Override
+        public boolean matches(Element root, Element element) {
+            return evaluator.matches(root, element);
+        }
+
+        @Override protected int cost() {
+            return 2 + evaluator.cost();
+        }
+
+        @Override
+        public String toString() {
+            return String.format(":is(%s)", evaluator);
+        }
+    }
+
     static class Not extends StructuralEvaluator {
         public Not(Evaluator evaluator) {
             super(evaluator);
@@ -189,7 +208,9 @@ void add(Evaluator evaluator) {
 
         @Override
         public boolean matches(Element root, Element element) {
-            // evaluate from last to first
+            if (element == root)
+                return false; // cannot match as the second eval (first parent test) would be above the root
+
             for (int i = evaluators.size() -1; i >= 0; --i) {
                 if (element == null)
                     return false;
diff --git a/src/main/java/org/jsoup/select/package-info.java b/src/main/java/org/jsoup/select/package-info.java
index 5bbdb85543..34d3388aad 100644
--- a/src/main/java/org/jsoup/select/package-info.java
+++ b/src/main/java/org/jsoup/select/package-info.java
@@ -2,7 +2,7 @@
  Packages to support the CSS-style element selector.
  {@link org.jsoup.select.Selector Selector defines the query syntax.}
  */
-@NonnullByDefault
+@NullMarked
 package org.jsoup.select;
 
-import org.jsoup.internal.NonnullByDefault;
+import org.jspecify.annotations.NullMarked;
diff --git a/src/main/java9/module-info.java b/src/main/java9/module-info.java
new file mode 100644
index 0000000000..31bd333877
--- /dev/null
+++ b/src/main/java9/module-info.java
@@ -0,0 +1,11 @@
+module org.jsoup {
+    exports org.jsoup;
+    exports org.jsoup.helper;
+    exports org.jsoup.nodes;
+    exports org.jsoup.parser;
+    exports org.jsoup.safety;
+    exports org.jsoup.select;
+
+    requires transitive java.xml; // for org.w3c.dom out of W3CDom
+    requires static org.jspecify; // nullability annotations
+}
diff --git a/src/main/java9/org/jsoup/helper/RequestAuthHandler.java b/src/main/java9/org/jsoup/helper/RequestAuthHandler.java
new file mode 100644
index 0000000000..0df80de209
--- /dev/null
+++ b/src/main/java9/org/jsoup/helper/RequestAuthHandler.java
@@ -0,0 +1,24 @@
+package org.jsoup.helper;
+
+import java.net.HttpURLConnection;
+
+/**
+ A per-request authentication shim, used in Java 9+.
+ */
+class RequestAuthHandler implements AuthenticationHandler.AuthShim {
+    public RequestAuthHandler() {}
+
+    @Override public void enable(RequestAuthenticator auth, HttpURLConnection con) {
+        AuthenticationHandler authenticator = new AuthenticationHandler(auth);
+        con.setAuthenticator(authenticator);
+    }
+
+    @Override public void remove() {
+        // noop; would remove thread-local in Global Handler
+    }
+
+    @Override public AuthenticationHandler get(AuthenticationHandler helper) {
+        // would get thread-local in Global Handler
+        return helper;
+    }
+}
diff --git a/src/test/java/org/jsoup/helper/AuthenticationHandlerTest.java b/src/test/java/org/jsoup/helper/AuthenticationHandlerTest.java
new file mode 100644
index 0000000000..c0dd692d37
--- /dev/null
+++ b/src/test/java/org/jsoup/helper/AuthenticationHandlerTest.java
@@ -0,0 +1,7 @@
+package org.jsoup.helper;
+
+public class AuthenticationHandlerTest {
+    public static final int MaxAttempts = AuthenticationHandler.MaxAttempts;
+
+    // tests are in ConnectTest, ProxyTest. This class just makes the MaxAttempts visible for test.
+}
diff --git a/src/test/java/org/jsoup/helper/HttpConnectionTest.java b/src/test/java/org/jsoup/helper/HttpConnectionTest.java
index 8df0f80397..5757d1d27a 100644
--- a/src/test/java/org/jsoup/helper/HttpConnectionTest.java
+++ b/src/test/java/org/jsoup/helper/HttpConnectionTest.java
@@ -7,7 +7,9 @@
 import org.junit.jupiter.api.Test;
 
 import java.io.IOException;
+import java.net.Authenticator;
 import java.net.MalformedURLException;
+import java.net.PasswordAuthentication;
 import java.net.URL;
 import java.util.ArrayList;
 import java.util.Collection;
@@ -373,4 +375,37 @@ public void caseInsensitiveHeaders(Locale locale) {
         String actual = connect.request().header("Key");
         assertEquals(value, actual);
     }
+
+    @Test void setAuth() throws MalformedURLException {
+        Connection con = Jsoup.newSession();
+
+        assertNull(con.request().auth());
+
+        RequestAuthenticator auth1 = new RequestAuthenticator() {
+            @Override public PasswordAuthentication authenticate(Context auth) {
+                return auth.credentials("foo", "bar");
+            }
+        };
+
+        RequestAuthenticator auth2 = new RequestAuthenticator() {
+            @Override public PasswordAuthentication authenticate(Context auth) {
+                return auth.credentials("qux", "baz");
+            }
+        };
+
+        con.auth(auth1);
+        assertSame(con.request().auth(), auth1);
+
+        con.auth(auth2);
+        assertSame(con.request().auth(), auth2);
+
+        con.request().auth(auth1);
+        assertSame(con.request().auth(), auth1);
+
+        PasswordAuthentication creds = auth1.authenticate(
+            new RequestAuthenticator.Context(new URL("http://example.com"), Authenticator.RequestorType.SERVER, "Realm"));
+        assertNotNull(creds);
+        assertEquals("foo", creds.getUserName());
+        assertEquals("bar", new String(creds.getPassword()));
+    }
 }
diff --git a/src/test/java/org/jsoup/helper/W3CDomTest.java b/src/test/java/org/jsoup/helper/W3CDomTest.java
index c1daeb57b0..fe8379aea8 100644
--- a/src/test/java/org/jsoup/helper/W3CDomTest.java
+++ b/src/test/java/org/jsoup/helper/W3CDomTest.java
@@ -345,5 +345,26 @@ public void canOutputHtmlWithoutNamespace() {
         org.jsoup.nodes.TextNode jText = (TextNode) jDiv.childNode(0).childNode(0);
         assertEquals(jText, textNode.getUserData(W3CDom.SourceProperty));
     }
+    
+    @Test public void canXmlParseCdataNodes() throws XPathExpressionException {
+        String html = "<p><script>1 && 2</script><style>3 && 4</style> 5 &amp;&amp; 6</p>";
+        org.jsoup.nodes.Document jdoc = Jsoup.parse(html);
+        jdoc.outputSettings().syntax(org.jsoup.nodes.Document.OutputSettings.Syntax.xml);
+        String xml = jdoc.body().html();
+        assertTrue(xml.contains("<script><![CDATA[")); // as asserted in ElementTest
+        Document doc = parseXml(xml, false);
+        NodeList list = xpath(doc, "//script");
+        assertEquals(1, list.getLength());
+        Node script = list.item(0); // will be the cdata node
+        assertEquals("1 && 2", script.getTextContent());
+    }
+
+    @Test public void handlesEmptyDoctype() {
+        String html = "<!doctype>Foo";
+        org.jsoup.nodes.Document jdoc = Jsoup.parse(html);
+        Document doc = (new W3CDom()).fromJsoup(jdoc);
+        assertNull(doc.getDoctype());
+        assertEquals("Foo", doc.getFirstChild().getTextContent());
+    }
 
 }
diff --git a/src/test/java/org/jsoup/integration/ConnectIT.java b/src/test/java/org/jsoup/integration/ConnectIT.java
index afd188989d..c7b63c37a9 100644
--- a/src/test/java/org/jsoup/integration/ConnectIT.java
+++ b/src/test/java/org/jsoup/integration/ConnectIT.java
@@ -2,9 +2,9 @@
 
 import org.jsoup.Connection;
 import org.jsoup.Jsoup;
+import org.jsoup.helper.DataUtil;
 import org.jsoup.integration.servlets.FileServlet;
 import org.jsoup.integration.servlets.SlowRider;
-import org.jsoup.internal.ConstrainableInputStream;
 import org.jsoup.nodes.Document;
 import org.jsoup.nodes.Element;
 import org.junit.jupiter.api.Test;
@@ -142,16 +142,13 @@ public void remainingAfterFirstRead() throws IOException {
         int capSize = 100 * 1024;
 
         String url = FileServlet.urlTo("/htmltests/large.html"); // 280 K
-        ConstrainableInputStream stream;
-        try (BufferedInputStream inputStream = Jsoup.connect(url).maxBodySize(capSize)
-            .execute().bodyStream()) {
 
-            assertTrue(inputStream instanceof ConstrainableInputStream);
-            stream = (ConstrainableInputStream) inputStream;
+        try (BufferedInputStream stream = Jsoup.connect(url).maxBodySize(capSize)
+            .execute().bodyStream()) {
 
             // simulates parse which does a limited read first
             stream.mark(bufferSize);
-            ByteBuffer firstBytes = stream.readToByteBuffer(bufferSize);
+            ByteBuffer firstBytes = DataUtil.readToByteBuffer(stream, bufferSize);
 
             byte[] array = firstBytes.array();
             String firstText = new String(array, StandardCharsets.UTF_8);
@@ -163,9 +160,13 @@ public void remainingAfterFirstRead() throws IOException {
 
             // reset and read again
             stream.reset();
-            ByteBuffer fullRead = stream.readToByteBuffer(0);
+            ByteBuffer fullRead = DataUtil.readToByteBuffer(stream, 0);
             byte[] fullArray = fullRead.array();
-            assertEquals(capSize, fullArray.length);
+
+            // bodyStream is not capped to body size - only for jsoup consumed stream
+            assertTrue(fullArray.length > capSize);
+
+            assertEquals(280735, fullArray.length);
             String fullText = new String(fullArray, StandardCharsets.UTF_8);
             assertTrue(fullText.startsWith(firstText));
         }
@@ -176,14 +177,10 @@ public void noLimitAfterFirstRead() throws IOException {
         int bufferSize = 5 * 1024;
 
         String url = FileServlet.urlTo("/htmltests/large.html"); // 280 K
-        ConstrainableInputStream stream;
-        try (BufferedInputStream inputStream = Jsoup.connect(url).execute().bodyStream()) {
-            assertTrue(inputStream instanceof ConstrainableInputStream);
-            stream = (ConstrainableInputStream) inputStream;
-
+        try (BufferedInputStream stream = Jsoup.connect(url).execute().bodyStream()) {
             // simulates parse which does a limited read first
             stream.mark(bufferSize);
-            ByteBuffer firstBytes = stream.readToByteBuffer(bufferSize);
+            ByteBuffer firstBytes = DataUtil.readToByteBuffer(stream, bufferSize);
             byte[] array = firstBytes.array();
             String firstText = new String(array, StandardCharsets.UTF_8);
             assertTrue(firstText.startsWith("<html><head><title>Large"));
@@ -191,11 +188,27 @@ public void noLimitAfterFirstRead() throws IOException {
 
             // reset and read fully
             stream.reset();
-            ByteBuffer fullRead = stream.readToByteBuffer(0);
+            ByteBuffer fullRead = DataUtil.readToByteBuffer(stream, 0);
             byte[] fullArray = fullRead.array();
             assertEquals(280735, fullArray.length);
             String fullText = new String(fullArray, StandardCharsets.UTF_8);
             assertTrue(fullText.startsWith(firstText));
         }
     }
+
+    @Test public void bodyStreamConstrainedViaBufferUp() throws IOException {
+        int cap = 5 * 1024;
+        String url = FileServlet.urlTo("/htmltests/large.html"); // 280 K
+        try (BufferedInputStream stream = Jsoup
+            .connect(url)
+            .maxBodySize(cap)
+            .execute()
+            .bufferUp()
+            .bodyStream()) {
+
+            ByteBuffer cappedRead = DataUtil.readToByteBuffer(stream, 0);
+            byte[] cappedArray = cappedRead.array();
+            assertEquals(cap, cappedArray.length);
+        }
+    }
 }
diff --git a/src/test/java/org/jsoup/integration/ConnectTest.java b/src/test/java/org/jsoup/integration/ConnectTest.java
index f02840a0cb..4b1c580c12 100644
--- a/src/test/java/org/jsoup/integration/ConnectTest.java
+++ b/src/test/java/org/jsoup/integration/ConnectTest.java
@@ -4,6 +4,7 @@
 import org.jsoup.HttpStatusException;
 import org.jsoup.Jsoup;
 import org.jsoup.Connection.Method;
+import org.jsoup.UnsupportedMimeTypeException;
 import org.jsoup.helper.DataUtil;
 import org.jsoup.helper.W3CDom;
 import org.jsoup.integration.servlets.*;
@@ -11,21 +12,31 @@
 import org.jsoup.nodes.Document;
 import org.jsoup.nodes.Element;
 import org.jsoup.nodes.FormElement;
+import org.jsoup.nodes.Node;
+import org.jsoup.nodes.XmlDeclaration;
 import org.jsoup.parser.HtmlTreeBuilder;
 import org.jsoup.parser.Parser;
 import org.jsoup.parser.XmlTreeBuilder;
 import org.junit.jupiter.api.BeforeAll;
 import org.junit.jupiter.api.Test;
+import org.junit.jupiter.params.ParameterizedTest;
+import org.junit.jupiter.params.provider.MethodSource;
 
+import javax.servlet.http.HttpServletResponse;
 import java.io.File;
 import java.io.FileInputStream;
 import java.io.IOException;
+import java.net.Authenticator;
 import java.net.MalformedURLException;
 import java.net.URL;
 import java.net.URLDecoder;
+import java.nio.file.Files;
 import java.util.List;
 import java.util.Map;
+import java.util.concurrent.atomic.AtomicInteger;
+import java.util.stream.Stream;
 
+import static org.jsoup.helper.AuthenticationHandlerTest.MaxAttempts;
 import static org.jsoup.helper.HttpConnection.CONTENT_TYPE;
 import static org.jsoup.helper.HttpConnection.MULTIPART_FORM_DATA;
 import static org.jsoup.integration.UrlConnectTest.browserUa;
@@ -51,6 +62,13 @@ public void canConnectToLocalServer() throws IOException {
         assertEquals("Hello, World!", p.text());
     }
 
+    @Test void canConnectToLocalTlsServer() throws IOException {
+        String url = HelloServlet.TlsUrl;
+        Document doc = Jsoup.connect(url).get();
+        Element p = doc.selectFirst("p");
+        assertEquals("Hello, World!", p.text());
+    }
+
     @Test
     public void fetchURl() throws IOException {
         Document doc = Jsoup.parse(new URL(echoUrl), 10 * 1000);
@@ -78,7 +96,7 @@ public void exceptOnUnsupportedProtocol() {
         assertTrue(threw);
     }
 
-    private static String ihVal(String key, Document doc) {
+    static String ihVal(String key, Document doc) {
         final Element first = doc.select("th:contains(" + key + ") + td").first();
         return first != null ? first.text() : null;
     }
@@ -283,16 +301,16 @@ public void doesDeleteWithoutBody() throws IOException {
     /**
      * Tests upload of content to a remote service.
      */
-    @Test
-    public void postFiles() throws IOException {
+    @ParameterizedTest @MethodSource("echoUrls") // http and https
+    public void postFiles(String url) throws IOException {
         File thumb = ParseTest.getFile("/htmltests/thumb.jpg");
         File html = ParseTest.getFile("/htmltests/large.html");
 
         Document res = Jsoup
-            .connect(EchoServlet.Url)
+            .connect(url)
             .data("firstname", "Jay")
-            .data("firstPart", thumb.getName(), new FileInputStream(thumb), "image/jpeg")
-            .data("secondPart", html.getName(), new FileInputStream(html)) // defaults to "application-octetstream";
+            .data("firstPart", thumb.getName(), Files.newInputStream(thumb.toPath()), "image/jpeg")
+            .data("secondPart", html.getName(), Files.newInputStream(html.toPath())) // defaults to "application/octet-stream";
             .data("surname", "Soup")
             .post();
 
@@ -403,7 +421,7 @@ public void multiCookieSet() throws IOException {
 
     @Test
     public void supportsDeflate() throws IOException {
-        Connection.Response res = Jsoup.connect(Deflateservlet.Url).execute();
+        Connection.Response res = Jsoup.connect(DeflateServlet.Url).execute();
         assertEquals("deflate", res.header("Content-Encoding"));
 
         Document doc = res.parse();
@@ -494,7 +512,7 @@ public void handlesWrongContentLengthDuringBufferedRead() throws IOException {
     }
 
     @Test
-    public void testBinaryContentTypeThrowsException() {
+    public void testBinaryContentTypeThrowsException() throws IOException {
         Connection con = Jsoup.connect(FileServlet.urlTo("/htmltests/thumb.jpg"));
         con.data(FileServlet.ContentTypeParam, "image/jpeg");
 
@@ -502,9 +520,9 @@ public void testBinaryContentTypeThrowsException() {
         try {
             con.execute();
             Document doc = con.response().parse();
-        } catch (IOException e) {
+        } catch (UnsupportedMimeTypeException e) {
             threw = true;
-            assertEquals("Unhandled content type. Must be text/*, application/xml, or application/*+xml", e.getMessage());
+            assertEquals("Unhandled content type. Must be text/*, */xml, or */*+xml", e.getMessage());
         }
         assertTrue(threw);
     }
@@ -525,6 +543,26 @@ public void testBinaryContentTypeThrowsException() {
         assertEquals(Document.OutputSettings.Syntax.xml, doc.outputSettings().syntax());
     }
 
+    @Test public void imageXmlMimeType() throws IOException {
+        // test that we switch to XML, and that we support image/svg+xml
+        String mimetype = "image/svg+xml";
+
+        Connection con = Jsoup.connect(FileServlet.urlTo("/htmltests/osi-logo.svg"))
+            .data(FileServlet.ContentTypeParam, mimetype);
+        Document doc = con.get();
+
+        assertEquals(mimetype, con.response().contentType());
+        assertTrue(doc.parser().getTreeBuilder() instanceof XmlTreeBuilder);
+        assertEquals(Document.OutputSettings.Syntax.xml, doc.outputSettings().syntax());
+        Node firstChild = doc.firstChild();
+        XmlDeclaration decl = (XmlDeclaration) firstChild;
+        assertEquals("no", decl.attr("standalone"));
+        Element svg = doc.expectFirst("svg");
+        Element flowRoot = svg.expectFirst("flowRoot");
+        assertEquals("flowRoot", flowRoot.tagName());
+        assertEquals("preserve", flowRoot.attr("xml:space"));
+    }
+
     @Test
     public void canFetchBinaryAsBytes() throws IOException {
         Connection.Response res = Jsoup.connect(FileServlet.urlTo("/htmltests/thumb.jpg"))
@@ -734,11 +772,11 @@ public void maxBodySizeInReadToByteBuffer() throws IOException {
         assertEquals("", ihVal("Query String", resultDoc));
 
         // new request to echo, should not have form data, but should have cookies from implicit session
-        Document newEcho = submit.newRequest().url(echoUrl).get();
+        Document newEcho = submit.newRequest(echoUrl).get();
         assertEquals("One=EchoServlet; One=Root", ihVal("Cookie", newEcho));
         assertEquals("", ihVal("Query String", newEcho));
 
-        Document cookieDoc = submit.newRequest().url(cookieUrl).get();
+        Document cookieDoc = submit.newRequest(cookieUrl).get();
         assertEquals("CookieServlet", ihVal("One", cookieDoc)); // different cookie path
 
     }
@@ -749,7 +787,7 @@ public void maxBodySizeInReadToByteBuffer() throws IOException {
         String startUrl = FileServlet.urlTo("/htmltests/form-tests.html");
 
         Connection session = Jsoup.newSession();
-        Document loginDoc = session.newRequest().url(startUrl).get();
+        Document loginDoc = session.newRequest(startUrl).get();
         FormElement form = loginDoc.expectForm("#login2");
         assertNotNull(form);
         String username = "admin";
@@ -766,7 +804,7 @@ public void maxBodySizeInReadToByteBuffer() throws IOException {
         assertEquals(Connection.Method.POST, postRes.method());
         Document resultDoc = postRes.parse();
 
-        Document echo2 = resultDoc.connection().newRequest().url(echoUrl).get();
+        Document echo2 = resultDoc.connection().newRequest(echoUrl).get();
         assertEquals("", ihVal("Query String", echo2)); // should not re-send the data
         assertEquals("One=EchoServlet; One=Root", ihVal("Cookie", echo2));
     }
@@ -786,4 +824,77 @@ public void maxBodySizeInReadToByteBuffer() throws IOException {
         assertEquals("%E9%8D%B5=%E5%80%A4", ihVal("Query String", doc));
         assertEquals("鍵=値", URLDecoder.decode(ihVal("Query String", doc), DataUtil.UTF_8.name()));
     }
+
+    /**
+     Provides HTTP and HTTPS EchoServlet URLs
+     */
+    private static Stream<String> echoUrls() {
+        return Stream.of(EchoServlet.Url, EchoServlet.TlsUrl);
+    }
+
+    @ParameterizedTest @MethodSource("echoUrls")
+    void failsIfNotAuthenticated(String url) throws IOException {
+        String password = AuthFilter.newServerPassword(); // we don't send it, but ensures cache won't hit
+        Connection.Response res = Jsoup.connect(url)
+            .header(AuthFilter.WantsServerAuthentication, "1")
+            .ignoreHttpErrors(true)
+            .execute();
+
+        assertEquals(401, res.statusCode());
+    }
+
+    @ParameterizedTest @MethodSource("echoUrls")
+    void canAuthenticate(String url) throws IOException {
+        AtomicInteger count = new AtomicInteger(0);
+        String password = AuthFilter.newServerPassword();
+        Connection.Response res = Jsoup.connect(url)
+            .header(AuthFilter.WantsServerAuthentication, "1")
+            .auth(ctx -> {
+                count.incrementAndGet();
+                assertEquals(Authenticator.RequestorType.SERVER, ctx.type());
+                assertEquals("localhost", ctx.url().getHost());
+                assertEquals(AuthFilter.ServerRealm, ctx.realm());
+
+                return ctx.credentials(AuthFilter.ServerUser, password);
+            })
+            .execute();
+
+        assertEquals(1, count.get());
+
+        Document doc = res.parse();
+        assertTrue(ihVal("Authorization", doc).startsWith("Basic ")); // tests we set the auth header
+    }
+
+    @ParameterizedTest @MethodSource("echoUrls")
+    void incorrectAuth(String url) throws IOException {
+        Connection session = Jsoup.newSession()
+            .header(AuthFilter.WantsServerAuthentication, "1")
+            .ignoreHttpErrors(true);
+
+        String password = AuthFilter.newServerPassword();
+        int code = session.newRequest(url).execute().statusCode(); // no auth sent
+        assertEquals(HttpServletResponse.SC_UNAUTHORIZED, code);
+
+        AtomicInteger count = new AtomicInteger(0);
+        Connection.Response res = session.newRequest(url)
+            .auth(ctx -> {
+                count.incrementAndGet();
+                return ctx.credentials(AuthFilter.ServerUser, password + "wrong"); // incorrect
+            })
+            .execute();
+        assertEquals(MaxAttempts, count.get());
+        assertEquals(HttpServletResponse.SC_UNAUTHORIZED, res.statusCode());
+
+        AtomicInteger successCount = new AtomicInteger(0);
+        Connection.Response successRes = session.newRequest(url)
+            .auth(ctx -> {
+                successCount.incrementAndGet();
+                return ctx.credentials(AuthFilter.ServerUser, password); // correct
+            })
+            .execute();
+        assertEquals(1, successCount.get());
+        assertEquals(HttpServletResponse.SC_OK, successRes.statusCode());
+    }
+
+    // proxy connection tests are in ProxyTest
 }
diff --git a/src/test/java/org/jsoup/integration/FuzzFixesIT.java b/src/test/java/org/jsoup/integration/FuzzFixesIT.java
index a03758dd67..d528eda793 100644
--- a/src/test/java/org/jsoup/integration/FuzzFixesIT.java
+++ b/src/test/java/org/jsoup/integration/FuzzFixesIT.java
@@ -4,6 +4,7 @@
 import org.jsoup.nodes.Document;
 import org.jsoup.parser.Parser;
 import org.junit.jupiter.api.Assertions;
+import org.junit.jupiter.api.Disabled;
 import org.junit.jupiter.params.ParameterizedTest;
 import org.junit.jupiter.params.provider.MethodSource;
 
@@ -31,6 +32,7 @@ private static Stream<File> testFiles() {
         return Stream.of(files);
     }
 
+    @Disabled // disabled, as these soak up build time and the outcome oughtn't change unless we are refactoring the tree builders. manually execute as desired.
     @ParameterizedTest
     @MethodSource("testFiles")
     void testHtmlParse(File file) throws IOException {
@@ -44,7 +46,8 @@ void testHtmlParse(File file) throws IOException {
                 Assertions.fail(String.format("Timeout: only completed %d iters of [%s] in %d seconds", i, file.getName(), timeout));
         }
     }
-
+    
+    @Disabled // disabled, as these soak up build time and the outcome oughtn't change unless we are refactoring the tree builders. manually execute as desired.
     @ParameterizedTest
     @MethodSource("testFiles")
     void testXmlParse(File file) throws IOException {
diff --git a/src/test/java/org/jsoup/integration/ProxyTest.java b/src/test/java/org/jsoup/integration/ProxyTest.java
new file mode 100644
index 0000000000..18c1a60b49
--- /dev/null
+++ b/src/test/java/org/jsoup/integration/ProxyTest.java
@@ -0,0 +1,170 @@
+package org.jsoup.integration;
+
+import org.jsoup.Connection;
+import org.jsoup.Jsoup;
+import org.jsoup.integration.servlets.AuthFilter;
+import org.jsoup.integration.servlets.EchoServlet;
+import org.jsoup.integration.servlets.FileServlet;
+import org.jsoup.integration.servlets.HelloServlet;
+import org.jsoup.integration.servlets.ProxyServlet;
+import org.jsoup.integration.servlets.RedirectServlet;
+import org.jsoup.nodes.Document;
+import org.jsoup.nodes.Element;
+import org.junit.jupiter.api.BeforeAll;
+import org.junit.jupiter.api.Test;
+import org.junit.jupiter.params.ParameterizedTest;
+import org.junit.jupiter.params.provider.MethodSource;
+
+import javax.servlet.http.HttpServletResponse;
+import java.io.IOException;
+import java.util.concurrent.atomic.AtomicInteger;
+import java.util.stream.Stream;
+
+import static org.jsoup.helper.AuthenticationHandlerTest.MaxAttempts;
+import static org.jsoup.integration.ConnectTest.ihVal;
+import static org.junit.jupiter.api.Assertions.*;
+
+/**
+ Tests Jsoup.connect proxy support */
+public class ProxyTest {
+    private static String echoUrl;
+    private static TestServer.ProxySettings proxy;
+
+    @BeforeAll
+    public static void setUp() {
+        echoUrl = EchoServlet.Url;
+        proxy = ProxyServlet.ProxySettings;
+    }
+
+    @ParameterizedTest @MethodSource("helloUrls")
+    void fetchViaProxy(String url) throws IOException {
+        Connection con = Jsoup.connect(url)
+            .proxy(proxy.hostname, proxy.port);
+
+        Connection.Response res = con.execute();
+        if (url.startsWith("http:/")) assertVia(res); // HTTPS CONNECT won't have Via
+
+        Document doc = res.parse();
+        Element p = doc.expectFirst("p");
+        assertEquals("Hello, World!", p.text());
+    }
+
+    private static Stream<String> helloUrls() {
+        return Stream.of(HelloServlet.Url, HelloServlet.TlsUrl);
+    }
+
+    private static Stream<String> echoUrls() {
+        return Stream.of(EchoServlet.Url, EchoServlet.TlsUrl);
+    }
+
+    private static void assertVia(Connection.Response res) {
+        assertEquals(res.header("Via"), ProxyServlet.Via);
+    }
+
+    @Test void redirectViaProxy() throws IOException {
+        Connection.Response res = Jsoup
+            .connect(RedirectServlet.Url)
+            .data(RedirectServlet.LocationParam, echoUrl)
+            .header("Random-Header-name", "hello")
+            .proxy(proxy.hostname, proxy.port)
+            .execute();
+
+        assertVia(res);
+        Document doc = res.parse();
+        assertEquals(echoUrl, doc.location());
+        assertEquals("hello", ihVal("Random-Header-name", doc));
+        assertVia(res);
+    }
+
+    @Test void proxyForSession() throws IOException {
+        Connection session = Jsoup.newSession().proxy(proxy.hostname, proxy.port);
+
+        Connection.Response medRes = session.newRequest(FileServlet.urlTo("/htmltests/medium.html")).execute();
+        Connection.Response largeRes = session.newRequest(FileServlet.urlTo("/htmltests/large.html")).execute();
+
+        assertVia(medRes);
+        assertVia(largeRes);
+        assertEquals("Medium HTML", medRes.parse().title());
+        assertEquals("Large HTML", largeRes.parse().title());
+
+        Connection.Response smedRes = session.newRequest(FileServlet.tlsUrlTo("/htmltests/medium.html")).execute();
+        Connection.Response slargeRes = session.newRequest(FileServlet.tlsUrlTo("/htmltests/large.html")).execute();
+
+        assertEquals("Medium HTML", smedRes.parse().title());
+        assertEquals("Large HTML", slargeRes.parse().title());
+    }
+
+    @ParameterizedTest @MethodSource("echoUrls")
+    void canAuthenticateToProxy(String url) throws IOException {
+        int closed = TestServer.closeAuthedProxyConnections(); // reset any existing authed connections from previous tests, so we can test the auth flow
+
+        // the proxy wants auth, but not the server. HTTP and HTTPS, so tests direct proxy and CONNECT
+        Connection session = Jsoup.newSession()
+            .proxy(proxy.hostname, proxy.authedPort).ignoreHttpErrors(true);
+        String password = AuthFilter.newProxyPassword();
+
+        // fail first
+        try {
+            Connection.Response execute = session.newRequest(url)
+                .execute();
+            int code = execute.statusCode(); // no auth sent
+            assertEquals(HttpServletResponse.SC_PROXY_AUTHENTICATION_REQUIRED, code);
+        } catch (IOException e) {
+            // in CONNECT (for the HTTPS url), URLConnection will throw the proxy connect as a Stringly typed IO exception - "Unable to tunnel through proxy. Proxy returns "HTTP/1.1 407 Proxy Authentication Required"". (Not a response code)
+            assertTrue(e.getMessage().contains("407"));
+        }
+
+        try {
+            AtomicInteger count = new AtomicInteger(0);
+            Connection.Response res = session.newRequest(url)
+                .auth(ctx -> {
+                    count.incrementAndGet();
+                    return ctx.credentials(AuthFilter.ProxyUser, password + "wrong"); // incorrect
+                })
+                .execute();
+            assertEquals(MaxAttempts, count.get());
+            assertEquals(HttpServletResponse.SC_PROXY_AUTHENTICATION_REQUIRED, res.statusCode());
+        } catch (IOException e) {
+            assertTrue(e.getMessage().contains("407"));
+        }
+
+        AtomicInteger successCount = new AtomicInteger(0);
+        Connection.Response successRes = session.newRequest(url)
+            .auth(ctx -> {
+                successCount.incrementAndGet();
+                return ctx.credentials(AuthFilter.ProxyUser, password); // correct
+            })
+            .execute();
+        assertEquals(1, successCount.get());
+        assertEquals(HttpServletResponse.SC_OK, successRes.statusCode());
+    }
+
+    @ParameterizedTest @MethodSource("echoUrls")
+    void canAuthToProxyAndServer(String url) throws IOException {
+        String serverPassword = AuthFilter.newServerPassword();
+        String proxyPassword = AuthFilter.newProxyPassword();
+        AtomicInteger count = new AtomicInteger(0);
+
+        Connection session = Jsoup.newSession() // both proxy and server will want auth
+            .proxy(proxy.hostname, proxy.authedPort)
+            .header(AuthFilter.WantsServerAuthentication, "1")
+            .auth(auth -> {
+                count.incrementAndGet();
+
+                if (auth.isServer()) {
+                    assertEquals(url, auth.url().toString());
+                    assertEquals(AuthFilter.ServerRealm, auth.realm());
+                    return auth.credentials(AuthFilter.ServerUser, serverPassword);
+                } else {
+                    assertTrue(auth.isProxy());
+                    return auth.credentials(AuthFilter.ProxyUser, proxyPassword);
+                }
+            });
+
+
+        Connection.Response res = session.newRequest(url).execute();
+        assertEquals(200, res.statusCode());
+        assertEquals(2, count.get()); // hit server and proxy auth stages
+        assertEquals("Webserver Environment Variables", res.parse().title());
+    }
+}
diff --git a/src/test/java/org/jsoup/integration/TestServer.java b/src/test/java/org/jsoup/integration/TestServer.java
index fa370d1524..777ccd3050 100644
--- a/src/test/java/org/jsoup/integration/TestServer.java
+++ b/src/test/java/org/jsoup/integration/TestServer.java
@@ -1,42 +1,188 @@
 package org.jsoup.integration;
 
+import org.eclipse.jetty.http.HttpVersion;
+import org.eclipse.jetty.server.Connector;
+import org.eclipse.jetty.server.HttpConfiguration;
+import org.eclipse.jetty.server.HttpConnectionFactory;
+import org.eclipse.jetty.server.SecureRequestCustomizer;
 import org.eclipse.jetty.server.Server;
 import org.eclipse.jetty.server.ServerConnector;
+import org.eclipse.jetty.server.SslConnectionFactory;
+import org.eclipse.jetty.server.handler.HandlerWrapper;
+import org.eclipse.jetty.servlet.FilterHolder;
+import org.eclipse.jetty.servlet.FilterMapping;
 import org.eclipse.jetty.servlet.ServletHandler;
+import org.eclipse.jetty.util.ssl.SslContextFactory;
+import org.jsoup.integration.servlets.AuthFilter;
 import org.jsoup.integration.servlets.BaseServlet;
+import org.jsoup.integration.servlets.ProxyServlet;
 
+import javax.net.ssl.HttpsURLConnection;
+import javax.net.ssl.SSLContext;
+import javax.net.ssl.SSLSocketFactory;
+import javax.net.ssl.TrustManager;
+import javax.net.ssl.TrustManagerFactory;
+import java.io.File;
+import java.io.FileNotFoundException;
+import java.io.IOException;
 import java.net.InetSocketAddress;
+import java.nio.file.Files;
+import java.security.KeyManagementException;
+import java.security.KeyStore;
+import java.security.KeyStoreException;
+import java.security.NoSuchAlgorithmException;
+import java.security.cert.CertificateException;
+import java.util.concurrent.atomic.AtomicInteger;
 
 public class TestServer {
-    private static final Server jetty = new Server(new InetSocketAddress("localhost", 0));
-    private static final ServletHandler handler = new ServletHandler();
+    static int Port; // local port of the first Jetty connector; assigned in start()
+    static int TlsPort; // local port of the second Jetty connector (the added HTTPS one); assigned in start()
+
+    private static final String Localhost = "localhost";
+    private static final String KeystorePassword = "hunter2"; // password of the test keystore, /local-cert/server.pfx
+
+    private static final Server Jetty = newServer(); // the web server that test servlets are mapped onto
+    private static final ServletHandler JettyHandler = new ServletHandler();
+    private static final Server Proxy = newServer(); // its handler is created with alwaysAuth = false, in start()
+    private static final Server AuthedProxy = newServer(); // its handler is created with alwaysAuth = true, in start()
+    private static final HandlerWrapper ProxyHandler = new HandlerWrapper();
+    private static final HandlerWrapper AuthedProxyHandler = new HandlerWrapper();
+    private static final ProxySettings ProxySettings = new ProxySettings();
+    // port 0 leaves the choice of port to the system; the actual ports are read back in start()
+    private static Server newServer() {
+        return new Server(new InetSocketAddress(Localhost, 0));
+    }
 
     static {
-        jetty.setHandler(handler);
+        Jetty.setHandler(JettyHandler);
+        Proxy.setHandler(ProxyHandler);
+        AuthedProxy.setHandler(AuthedProxyHandler);
+
+        // TLS setup:
+        try {
+            File keystoreFile = ParseTest.getFile("/local-cert/server.pfx");
+            if (!keystoreFile.exists()) throw new FileNotFoundException(keystoreFile.toString());
+            addHttpsConnector(keystoreFile, Jetty);
+            setupDefaultTrust(keystoreFile);
+        } catch (Exception e) {
+            throw new IllegalStateException(e);
+        }
     }
 
     private TestServer() {
     }
 
     public static void start() {
-        synchronized (jetty) {
+        synchronized (Jetty) {
+            if (Jetty.isStarted()) return;
+
             try {
-                jetty.start(); // jetty will safely no-op a start on an already running instance
+                Jetty.start();
+                JettyHandler.addFilterWithMapping(new FilterHolder(new AuthFilter(false, false)), "/*", FilterMapping.ALL);
+                Connector[] jcons = Jetty.getConnectors();
+                Port = ((ServerConnector) jcons[0]).getLocalPort();
+                TlsPort = ((ServerConnector) jcons[1]).getLocalPort();
+
+                ProxyHandler.setHandler(ProxyServlet.createHandler(false)); // includes proxy, CONNECT proxy, and Auth filters
+                Proxy.start();
+                ProxySettings.port = ((ServerConnector) Proxy.getConnectors()[0]).getLocalPort();
+
+                AuthedProxyHandler.setHandler(ProxyServlet.createHandler(true));
+                AuthedProxy.start();
+                ProxySettings.authedPort = ((ServerConnector) AuthedProxy.getConnectors()[0]).getLocalPort();
             } catch (Exception e) {
                 throw new IllegalStateException(e);
             }
         }
     }
 
-    public static String map(Class<? extends BaseServlet> servletClass) {
-        synchronized (jetty) {
-            if (!jetty.isStarted())
+    /**
+     Closes every endpoint currently connected to the authed proxy, and returns how many were closed. A tunneled
+     connection authenticates only in its first CONNECT and may then be kept alive and reused, so a test that moves
+     from an unauthed to an authed flow needs those connections dropped first.
+     */
+    static int closeAuthedProxyConnections() {
+        ServerConnector authedConnector = (ServerConnector) AuthedProxy.getConnectors()[0];
+        int closed = 0;
+        for (org.eclipse.jetty.io.EndPoint endPoint : authedConnector.getConnectedEndPoints()) {
+            endPoint.close();
+            closed++;
+        }
+        return closed;
+    }
+
+    public static ServletUrls map(Class<? extends BaseServlet> servletClass) {
+        synchronized (Jetty) {
+            if (!Jetty.isStarted())
                 start(); // if running out of the test cases
 
             String path = "/" + servletClass.getSimpleName();
-            handler.addServletWithMapping(servletClass, path + "/*");
-            int port = ((ServerConnector) jetty.getConnectors()[0]).getLocalPort();
-            return "http://localhost:" + port + path;
+            JettyHandler.addServletWithMapping(servletClass, path + "/*");
+            String url = "http://" + Localhost + ":" + Port + path;
+            String tlsUrl = "https://" + Localhost + ":" + TlsPort + path;
+
+            return new ServletUrls(url, tlsUrl);
+        }
+    }
+
+    public static class ServletUrls {
+        public final String url;
+        public final String tlsUrl;
+
+        public ServletUrls(String url, String tlsUrl) {
+            this.url = url;
+            this.tlsUrl = tlsUrl;
         }
     }
+
+    /** Returns the shared ProxySettings, first starting the servers (which assigns the proxy ports) if not yet started. */
+    public static ProxySettings proxySettings() {
+        synchronized (Jetty) {
+            boolean started = Jetty.isStarted();
+            if (!started) start();
+            return ProxySettings;
+        }
+    }
+
+    /** Where the test proxies listen: one hostname, plus a port each for the plain and the authed proxy (set in start()). */
+    public static class ProxySettings {
+        final String hostname = Localhost;
+        int port;
+        int authedPort;
+    }
+
+    private static void addHttpsConnector(File keystoreFile, Server server) {
+        // Adds a TLS connector, backed by the given keystore, to the server. Cribbed from https://github.com/jetty/jetty.project/blob/jetty-9.4.x/examples/embedded/src/main/java/org/eclipse/jetty/embedded/LikeJettyXml.java
+        SslContextFactory sslContextFactory = new SslContextFactory.Server();
+        String path = keystoreFile.getAbsolutePath();
+        sslContextFactory.setKeyStorePath(path);
+        sslContextFactory.setKeyStorePassword(KeystorePassword);
+        sslContextFactory.setKeyManagerPassword(KeystorePassword);
+        sslContextFactory.setTrustStorePath(path);
+        sslContextFactory.setTrustStorePassword(KeystorePassword);
+        // ^^ the one keystore file is used as both key store and trust store, with a single password
+        HttpConfiguration httpConfig = new HttpConfiguration();
+        httpConfig.setSecureScheme("https");
+        HttpConfiguration httpsConfig = new HttpConfiguration(httpConfig);
+        httpsConfig.addCustomizer(new SecureRequestCustomizer());
+        // the connector chains an SSL connection factory in front of the HTTP/1.1 connection factory
+        ServerConnector sslConnector = new ServerConnector(
+            server,
+            new SslConnectionFactory(sslContextFactory, HttpVersion.HTTP_1_1.asString()),
+            new HttpConnectionFactory(httpsConfig));
+        server.addConnector(sslConnector);
+    }
+
+    private static void setupDefaultTrust(File keystoreFile) throws KeyStoreException, IOException, NoSuchAlgorithmException, CertificateException, KeyManagementException {
+        // Configure HttpsUrlConnection (jsoup) to trust (only) this cert. The keystore stream is closed once it is loaded.
+        KeyStore trustStore = KeyStore.getInstance(KeyStore.getDefaultType());
+        try (java.io.InputStream keystoreStream = Files.newInputStream(keystoreFile.toPath())) {
+            trustStore.load(keystoreStream, KeystorePassword.toCharArray());
+        }
+        TrustManagerFactory trustManagerFactory = TrustManagerFactory.getInstance(TrustManagerFactory.getDefaultAlgorithm());
+        trustManagerFactory.init(trustStore);
+        SSLContext tls = SSLContext.getInstance("TLS");
+        tls.init(null, trustManagerFactory.getTrustManagers(), null); // only the trust managers are supplied
+        HttpsURLConnection.setDefaultSSLSocketFactory(tls.getSocketFactory()); // default for all HttpsURLConnections
+    }
 }
diff --git a/src/test/java/org/jsoup/integration/servlets/AuthFilter.java b/src/test/java/org/jsoup/integration/servlets/AuthFilter.java
new file mode 100644
index 0000000000..7ad700924f
--- /dev/null
+++ b/src/test/java/org/jsoup/integration/servlets/AuthFilter.java
@@ -0,0 +1,107 @@
+package org.jsoup.integration.servlets;
+
+import javax.servlet.Filter;
+import javax.servlet.FilterChain;
+import javax.servlet.FilterConfig;
+import javax.servlet.ServletException;
+import javax.servlet.ServletRequest;
+import javax.servlet.ServletResponse;
+import javax.servlet.http.HttpServletRequest;
+import javax.servlet.http.HttpServletResponse;
+import java.io.IOException;
+import java.nio.charset.StandardCharsets;
+import java.util.Base64;
+
+/**
+ A filter to test basic authenticated requests. If the request header "X-Wants-ServerAuthentication" (or, for a proxy,
+ "X-Wants-ProxyAuthentication") is set, or if alwaysWantsAuth is enabled, requests must send the correct credentials.
+ */
+public class AuthFilter implements Filter {
+    public static final String WantsServerAuthentication = "X-Wants-ServerAuthentication";
+    public static final String ServerUser = "admin";
+    public static final String ServerRealm = "jsoup test server authentication realm";
+    private static volatile String ServerPassword = newServerPassword();
+
+    public static final String WantsProxyAuthentication = "X-Wants-ProxyAuthentication";
+    public static final String ProxyUser = "foxyproxy";
+    public static final String ProxyRealm = "jsoup test proxy authentication realm";
+    private static volatile String ProxyPassword = newProxyPassword();
+
+    private final boolean alwaysWantsAuth; // we run a particular port that always wants auth - so the CONNECT tunnels can be authed. (The Java proxy tunnel CONNECT request strips the wants-auth headers)
+    private final boolean forProxy;
+    private final String wantsHeader; // request header that opts a request in to the auth check
+    private final String authorizationHeader; // request header that the credentials are read from
+
+    /**
+     Creates an Authentication Filter with hardcoded credential expectations.
+     * @param alwaysWantsAuth true if this filter should always check for authentication, regardless of the Wants Auth header
+     * @param forProxy true if this wraps a Proxy and should use Proxy-Authenticate headers, credentials etc. False
+     * if wrapping the web server.
+     */
+    public AuthFilter(boolean alwaysWantsAuth, boolean forProxy) {
+        this.alwaysWantsAuth = alwaysWantsAuth;
+        this.forProxy = forProxy;
+
+        wantsHeader = forProxy ? WantsProxyAuthentication : WantsServerAuthentication;
+        authorizationHeader = forProxy ? "Proxy-Authorization" : "Authorization";
+    }
+
+    private static String newPassword() {
+        return "pass-" + Math.random();
+    }
+
+    // passwords get rotated in tests so that Java's auth cache is invalidated and a new auth callback occurs.
+    // this requires that the tests hitting these are run serially. Each call replaces and returns the shared password.
+    public static String newServerPassword() {
+        return ServerPassword = newPassword() + "-server";
+    }
+
+    public static String newProxyPassword() {
+        return ProxyPassword = newPassword() + "-proxy";
+    }
+
+    @Override public void init(FilterConfig filterConfig) throws ServletException {}
+
+    @Override
+    public void doFilter(ServletRequest request, ServletResponse response, FilterChain chain) throws IOException, ServletException {
+        HttpServletRequest req = (HttpServletRequest) request;
+        HttpServletResponse res = (HttpServletResponse) response;
+
+        boolean accessGranted = checkAuth(req);
+        if (accessGranted) {
+            chain.doFilter(request, response);
+            return;
+        }
+
+        // Wants but failed auth - send appropriate header:
+        if (forProxy) {
+            res.setHeader("Proxy-Authenticate", "Basic realm=\"" + ProxyRealm + "\"");
+            // ^^ Duped in ProxyServlet for CONNECT
+            res.sendError(HttpServletResponse.SC_PROXY_AUTHENTICATION_REQUIRED);
+        } else {
+            res.setHeader("WWW-Authenticate", "Basic realm=\"" + ServerRealm + "\"");
+            res.sendError(HttpServletResponse.SC_UNAUTHORIZED);
+        }
+    }
+
+    @Override public void destroy() {}
+
+    /** Returns true if auth is not wanted for this request, or if it carries the currently expected Basic credentials. */
+    public boolean checkAuth(HttpServletRequest req) {
+        if (!alwaysWantsAuth && req.getHeader(wantsHeader) == null)
+            return true; // auth not required
+
+        String authHeader = req.getHeader(authorizationHeader);
+        if (authHeader == null) return false; // wanted, but no credentials were sent
+        int space = authHeader.indexOf(' ');
+        // only Basic is offered in the challenge, so any other scheme is refused; scheme names are case-insensitive
+        if (space <= 0 || !"Basic".equalsIgnoreCase(authHeader.substring(0, space)))
+            return false; // unexpected header value
+        String value = authHeader.substring(space + 1);
+        String expected = forProxy ?
+            (ProxyUser + ":" + ProxyPassword) :
+            (ServerUser + ":" + ServerPassword);
+        String base64 = Base64.getEncoder().encodeToString(expected.getBytes(StandardCharsets.UTF_8));
+        return base64.equals(value); // if passed auth
+    }
+}
diff --git a/src/test/java/org/jsoup/integration/servlets/BaseServlet.java b/src/test/java/org/jsoup/integration/servlets/BaseServlet.java
index 46d8e477e0..57acca8fe7 100644
--- a/src/test/java/org/jsoup/integration/servlets/BaseServlet.java
+++ b/src/test/java/org/jsoup/integration/servlets/BaseServlet.java
@@ -9,24 +9,25 @@
 public abstract class BaseServlet extends HttpServlet {
     static final String TextHtml = "text/html; charset=UTF-8";
 
-    // these are overridden just to get the response name to be 'res' not 'resp'
+    abstract protected void doIt(HttpServletRequest req, HttpServletResponse res) throws IOException, ServletException;
+
     @Override
-    protected void doGet(HttpServletRequest req, HttpServletResponse res) throws ServletException, IOException {
-        super.doGet(req, res);
+    protected void doGet(HttpServletRequest req, HttpServletResponse res) throws IOException, ServletException {
+        doIt(req, res);
     }
 
     @Override
-    protected void doPost(HttpServletRequest req, HttpServletResponse res) throws ServletException, IOException {
-        super.doPost(req, res);
+    protected void doPost(HttpServletRequest req, HttpServletResponse res) throws IOException, ServletException {
+        doIt(req, res);
     }
 
     @Override
-    protected void doPut(HttpServletRequest req, HttpServletResponse res) throws ServletException, IOException {
-        super.doPut(req, res);
+    protected void doPut(HttpServletRequest req, HttpServletResponse res) throws IOException, ServletException {
+        doIt(req, res);
     }
 
     @Override
-    protected void doDelete(HttpServletRequest req, HttpServletResponse res) throws ServletException, IOException {
-        super.doPut(req, res);
+    protected void doDelete(HttpServletRequest req, HttpServletResponse res) throws IOException, ServletException {
+        doIt(req, res);
     }
 }
diff --git a/src/test/java/org/jsoup/integration/servlets/CookieServlet.java b/src/test/java/org/jsoup/integration/servlets/CookieServlet.java
index 2249f971d8..ef5955f56b 100644
--- a/src/test/java/org/jsoup/integration/servlets/CookieServlet.java
+++ b/src/test/java/org/jsoup/integration/servlets/CookieServlet.java
@@ -2,35 +2,25 @@
 
 import org.jsoup.integration.TestServer;
 
-import javax.servlet.ServletException;
 import javax.servlet.http.Cookie;
 import javax.servlet.http.HttpServletRequest;
 import javax.servlet.http.HttpServletResponse;
 import java.io.IOException;
 import java.io.PrintWriter;
 
-public class CookieServlet extends BaseServlet{
-    public static final String Url = TestServer.map(CookieServlet.class);
+public class CookieServlet extends BaseServlet {
+    public static final String Url;
+    public static final String TlsUrl;
+    static {
+        TestServer.ServletUrls urls = TestServer.map(CookieServlet.class);
+        Url = urls.url;
+        TlsUrl = urls.tlsUrl;
+    }
     public static final String SetCookiesParam = "setCookies";
     public static final String LocationParam = "loc";
 
-
-    @Override
-    protected void doGet(HttpServletRequest req, HttpServletResponse res) throws ServletException, IOException {
-        doIt(req, res);
-    }
-
     @Override
-    protected void doPost(HttpServletRequest req, HttpServletResponse res) throws ServletException, IOException {
-        doIt(req, res);
-    }
-
-    @Override
-    protected void doPut(HttpServletRequest req, HttpServletResponse res) throws ServletException, IOException {
-        doIt(req, res);
-    }
-
-    private void doIt(HttpServletRequest req, HttpServletResponse res) throws IOException {
+    protected void doIt(HttpServletRequest req, HttpServletResponse res) throws IOException {
         // Do we want to set cookies?
         if (req.getParameter(SetCookiesParam) != null)
             setCookies(res);
diff --git a/src/test/java/org/jsoup/integration/servlets/Deflateservlet.java b/src/test/java/org/jsoup/integration/servlets/DeflateServlet.java
similarity index 74%
rename from src/test/java/org/jsoup/integration/servlets/Deflateservlet.java
rename to src/test/java/org/jsoup/integration/servlets/DeflateServlet.java
index 13af91624e..22cf4ea453 100644
--- a/src/test/java/org/jsoup/integration/servlets/Deflateservlet.java
+++ b/src/test/java/org/jsoup/integration/servlets/DeflateServlet.java
@@ -9,11 +9,17 @@
 import java.util.zip.Deflater;
 import java.util.zip.DeflaterOutputStream;
 
-public class Deflateservlet extends BaseServlet {
-    public static final String Url = TestServer.map(Deflateservlet.class);
+public class DeflateServlet extends BaseServlet {
+    public static final String Url;
+    public static final String TlsUrl;
+    static {
+        TestServer.ServletUrls urls = TestServer.map(DeflateServlet.class);
+        Url = urls.url;
+        TlsUrl = urls.tlsUrl;
+    }
 
     @Override
-    protected void doGet(HttpServletRequest req, HttpServletResponse res) throws IOException {
+    protected void doIt(HttpServletRequest req, HttpServletResponse res) throws IOException {
         res.setContentType(TextHtml);
         res.setStatus(HttpServletResponse.SC_OK);
         res.setHeader("Content-Encoding", "deflate");
diff --git a/src/test/java/org/jsoup/integration/servlets/EchoServlet.java b/src/test/java/org/jsoup/integration/servlets/EchoServlet.java
index c3a9c44a3f..6ff31a2a0d 100644
--- a/src/test/java/org/jsoup/integration/servlets/EchoServlet.java
+++ b/src/test/java/org/jsoup/integration/servlets/EchoServlet.java
@@ -22,30 +22,17 @@
 
 public class EchoServlet extends BaseServlet {
     public static final String CodeParam = "code";
-    public static final String Url = TestServer.map(EchoServlet.class);
     private static final int DefaultCode = HttpServletResponse.SC_OK;
-
-    @Override
-    protected void doGet(HttpServletRequest req, HttpServletResponse res) throws ServletException, IOException {
-        doIt(req, res);
-    }
-
-    @Override
-    protected void doPost(HttpServletRequest req, HttpServletResponse res) throws ServletException, IOException {
-        doIt(req, res);
+    public static final String Url;
+    public static final String TlsUrl;
+    static {
+        TestServer.ServletUrls urls = TestServer.map(EchoServlet.class);
+        Url = urls.url;
+        TlsUrl = urls.tlsUrl;
     }
 
     @Override
-    protected void doPut(HttpServletRequest req, HttpServletResponse res) throws ServletException, IOException {
-        doIt(req, res);
-    }
-
-    @Override
-    protected void doDelete(HttpServletRequest req, HttpServletResponse res) throws ServletException, IOException {
-        doIt(req, res);
-    }
-
-    private void doIt(HttpServletRequest req, HttpServletResponse res) throws IOException, ServletException {
+    protected void doIt(HttpServletRequest req, HttpServletResponse res) throws IOException, ServletException {
         int intCode = DefaultCode;
         String code = req.getHeader(CodeParam);
         if (code != null)
@@ -133,7 +120,7 @@ static void write(PrintWriter w, String key, String val) {
     // allow the servlet to run as a main program, for local test
     public static void main(String[] args) {
         TestServer.start();
-        System.out.println(Url);
+        System.out.println("Listening on " + Url + " and " + TlsUrl);
     }
 
     private static boolean maybeEnableMultipart(HttpServletRequest req) {
diff --git a/src/test/java/org/jsoup/integration/servlets/FileServlet.java b/src/test/java/org/jsoup/integration/servlets/FileServlet.java
index 7447e8c777..a97c43e69d 100644
--- a/src/test/java/org/jsoup/integration/servlets/FileServlet.java
+++ b/src/test/java/org/jsoup/integration/servlets/FileServlet.java
@@ -11,12 +11,18 @@
 import java.nio.file.Files;
 
 public class FileServlet extends BaseServlet {
-    public static final String Url = TestServer.map(FileServlet.class);
+    public static final String Url;
+    public static final String TlsUrl;
+    static {
+        TestServer.ServletUrls urls = TestServer.map(FileServlet.class);
+        Url = urls.url;
+        TlsUrl = urls.tlsUrl;
+    }
     public static final String ContentTypeParam = "contentType";
     public static final String DefaultType = "text/html";
 
     @Override
-    protected void doGet(HttpServletRequest req, HttpServletResponse res) throws IOException {
+    protected void doIt(HttpServletRequest req, HttpServletResponse res) throws IOException {
         String contentType = req.getParameter(ContentTypeParam);
         if (contentType == null)
             contentType = DefaultType;
@@ -33,7 +39,7 @@ protected void doGet(HttpServletRequest req, HttpServletResponse res) throws IOE
             Files.copy(file.toPath(), out);
             out.flush();
         } else {
-            res.setStatus(HttpServletResponse.SC_NOT_FOUND);
+            res.sendError(HttpServletResponse.SC_NOT_FOUND);
         }
     }
 
@@ -41,8 +47,7 @@ public static String urlTo(String path) {
         return Url + path;
     }
 
-    @Override
-    protected void doPost(HttpServletRequest req, HttpServletResponse res) throws IOException {
-        doGet(req, res);
+    public static String tlsUrlTo(String path) {
+        return TlsUrl + path;
     }
 }
diff --git a/src/test/java/org/jsoup/integration/servlets/HelloServlet.java b/src/test/java/org/jsoup/integration/servlets/HelloServlet.java
index 7a7924c775..aaae1fa706 100644
--- a/src/test/java/org/jsoup/integration/servlets/HelloServlet.java
+++ b/src/test/java/org/jsoup/integration/servlets/HelloServlet.java
@@ -7,10 +7,16 @@
 import java.io.IOException;
 
 public class HelloServlet extends BaseServlet {
-    public static final String Url = TestServer.map(HelloServlet.class);
+    public static final String Url;
+    public static final String TlsUrl;
+    static {
+        TestServer.ServletUrls urls = TestServer.map(HelloServlet.class);
+        Url = urls.url;
+        TlsUrl = urls.tlsUrl;
+    }
 
     @Override
-    protected void doGet(HttpServletRequest req, HttpServletResponse res) throws IOException {
+    protected void doIt(HttpServletRequest req, HttpServletResponse res) throws IOException {
         res.setContentType(TextHtml);
         res.setStatus(HttpServletResponse.SC_OK);
 
diff --git a/src/test/java/org/jsoup/integration/servlets/InterruptedServlet.java b/src/test/java/org/jsoup/integration/servlets/InterruptedServlet.java
index 22180e13d5..26b2fef9f5 100644
--- a/src/test/java/org/jsoup/integration/servlets/InterruptedServlet.java
+++ b/src/test/java/org/jsoup/integration/servlets/InterruptedServlet.java
@@ -8,13 +8,18 @@
 import java.io.IOException;
 
 public class InterruptedServlet extends BaseServlet {
-    public static final String Url = TestServer.map(InterruptedServlet.class);
+    public static final String Url;
+    public static final String TlsUrl;
+    static {
+        TestServer.ServletUrls urls = TestServer.map(InterruptedServlet.class);
+        Url = urls.url;
+        TlsUrl = urls.tlsUrl;
+    }
     public static final String Magnitude = "magnitude";
     public static final String Larger = "larger";
 
-
     @Override
-    protected void doGet(HttpServletRequest req, HttpServletResponse res) throws IOException {
+    protected void doIt(HttpServletRequest req, HttpServletResponse res) throws IOException {
         String magnitude = req.getParameter(Magnitude);
         magnitude  = magnitude == null ? "" : magnitude;
         res.setContentType(TextHtml);
diff --git a/src/test/java/org/jsoup/integration/servlets/ProxyServlet.java b/src/test/java/org/jsoup/integration/servlets/ProxyServlet.java
new file mode 100644
index 0000000000..bdd360bcf2
--- /dev/null
+++ b/src/test/java/org/jsoup/integration/servlets/ProxyServlet.java
@@ -0,0 +1,69 @@
+package org.jsoup.integration.servlets;
+
+import org.eclipse.jetty.client.api.Response;
+import org.eclipse.jetty.proxy.AsyncProxyServlet;
+import org.eclipse.jetty.proxy.ConnectHandler;
+import org.eclipse.jetty.server.Handler;
+import org.eclipse.jetty.servlet.FilterHolder;
+import org.eclipse.jetty.servlet.FilterMapping;
+import org.eclipse.jetty.servlet.ServletHandler;
+import org.eclipse.jetty.servlet.ServletHolder;
+import org.jsoup.integration.TestServer;
+
+import javax.servlet.http.HttpServletRequest;
+import javax.servlet.http.HttpServletResponse;
+
+import static org.jsoup.integration.servlets.AuthFilter.ProxyRealm;
+
+public class ProxyServlet extends AsyncProxyServlet {
+    public static TestServer.ProxySettings ProxySettings = TestServer.proxySettings();
+    public static String Via = "1.1 jsoup test proxy";
+    // ^^ the Via value is added to the headers of each proxied response, in onServerResponseHeaders
+    static {
+        System.setProperty("jdk.http.auth.tunneling.disabledSchemes", "");
+        // removes Basic, which is otherwise excluded from auth for CONNECT tunnels
+    }
+    /** Builds the handler for a proxy server; alwaysAuth is passed to the AuthFilter as its alwaysWantsAuth setting. */
+    public static Handler createHandler(boolean alwaysAuth) {
+        // ConnectHandler wraps this ProxyServlet and handles CONNECT, which sets up a tunnel for HTTPS requests and is
+        // opaque to the proxy. The ProxyServlet handles simple HTTP requests.
+        AuthFilter authFilter = new AuthFilter(alwaysAuth, true);
+        ConnectHandler connectHandler = new ConnectProxy(authFilter);
+        ServletHandler proxyHandler = new ServletHandler();
+        proxyHandler.addFilterWithMapping(new FilterHolder(authFilter), "/*", FilterMapping.ALL); // auth for HTTP proxy
+        ServletHolder proxyServletHolder = new ServletHolder(ProxyServlet.class); // Holder wraps as it requires maxThreads initialization
+        proxyServletHolder.setAsyncSupported(true);
+        proxyServletHolder.setInitParameter("maxThreads", "8");
+        proxyHandler.addServletWithMapping(proxyServletHolder, "/*");
+        connectHandler.setHandler(proxyHandler);
+
+        return connectHandler;
+    }
+    /** After the superclass has handled the server's response headers, adds the Via header to the proxy response. */
+    @Override
+    protected void onServerResponseHeaders(HttpServletRequest clientRequest, HttpServletResponse proxyResponse, Response serverResponse) {
+        super.onServerResponseHeaders(clientRequest, proxyResponse, serverResponse);
+        proxyResponse.addHeader("Via", Via);
+    }
+
+    /** Supports CONNECT tunnels, authenticating them with the same AuthFilter instance as the HTTP proxy path. */
+    static class ConnectProxy extends ConnectHandler {
+        final AuthFilter authFilter;
+
+        public ConnectProxy(AuthFilter authFilter) {
+            this.authFilter = authFilter;
+        }
+        /** Grants the CONNECT only if the AuthFilter's check passes; otherwise sets the Proxy-Authenticate challenge. */
+        @Override
+        protected boolean handleAuthentication(HttpServletRequest req, HttpServletResponse res, String address) {
+            boolean accessGranted = authFilter.checkAuth(req);
+            //System.err.println("CONNECT AUTH: " + accessGranted);
+
+            // need to add the desired auth header if not granted. Returning false here will also send 407 header
+            if (!accessGranted) {
+                res.setHeader("Proxy-Authenticate", "Basic realm=\"" + ProxyRealm + "\"");
+            }
+            return accessGranted;
+        }
+    }
+}
diff --git a/src/test/java/org/jsoup/integration/servlets/RedirectServlet.java b/src/test/java/org/jsoup/integration/servlets/RedirectServlet.java
index 5ab52a0bd5..0a937b772f 100644
--- a/src/test/java/org/jsoup/integration/servlets/RedirectServlet.java
+++ b/src/test/java/org/jsoup/integration/servlets/RedirectServlet.java
@@ -5,16 +5,23 @@
 import javax.servlet.http.Cookie;
 import javax.servlet.http.HttpServletRequest;
 import javax.servlet.http.HttpServletResponse;
+import java.io.IOException;
 
 public class RedirectServlet extends BaseServlet {
-    public static final String Url = TestServer.map(RedirectServlet.class);
+    public static final String Url;
+    public static final String TlsUrl;
+    static {
+        TestServer.ServletUrls urls = TestServer.map(RedirectServlet.class);
+        Url = urls.url;
+        TlsUrl = urls.tlsUrl;
+    }
     public static final String LocationParam = "loc";
     public static final String CodeParam = "code";
     public static final String SetCookiesParam = "setCookies";
     private static final int DefaultCode = HttpServletResponse.SC_MOVED_TEMPORARILY;
 
     @Override
-    protected void doGet(HttpServletRequest req, HttpServletResponse res) {
+    protected void doIt(HttpServletRequest req, HttpServletResponse res) throws IOException {
         String location = req.getParameter(LocationParam);
         if (location == null)
             location = "";
@@ -31,10 +38,7 @@ protected void doGet(HttpServletRequest req, HttpServletResponse res) {
 
         res.setHeader("Location", location);
         res.setStatus(intCode);
+        res.flushBuffer();
     }
 
-    @Override
-    protected void doPost(HttpServletRequest req, HttpServletResponse res) {
-        doGet(req, res);
-    }
 }
diff --git a/src/test/java/org/jsoup/integration/servlets/SlowRider.java b/src/test/java/org/jsoup/integration/servlets/SlowRider.java
index e8db460073..7298e0b346 100644
--- a/src/test/java/org/jsoup/integration/servlets/SlowRider.java
+++ b/src/test/java/org/jsoup/integration/servlets/SlowRider.java
@@ -11,12 +11,18 @@
  * Slowly, interminably writes output. For the purposes of testing timeouts and interrupts.
  */
 public class SlowRider extends BaseServlet {
-    public static final String Url = TestServer.map(SlowRider.class);
+    public static final String Url;
+    public static final String TlsUrl;
+    static {
+        TestServer.ServletUrls urls = TestServer.map(SlowRider.class);
+        Url = urls.url;
+        TlsUrl = urls.tlsUrl;
+    }
     private static final int SleepTime = 2000;
     public static final String MaxTimeParam = "maxTime";
 
     @Override
-    protected void doGet(HttpServletRequest req, HttpServletResponse res) throws IOException {
+    protected void doIt(HttpServletRequest req, HttpServletResponse res) throws IOException {
         pause(1000);
         res.setContentType(TextHtml);
         res.setStatus(HttpServletResponse.SC_OK);
diff --git a/src/test/java/org/jsoup/nodes/AttributesTest.java b/src/test/java/org/jsoup/nodes/AttributesTest.java
index bb415c0e00..f81ef322e1 100644
--- a/src/test/java/org/jsoup/nodes/AttributesTest.java
+++ b/src/test/java/org/jsoup/nodes/AttributesTest.java
@@ -7,6 +7,7 @@
 import java.util.Iterator;
 import java.util.List;
 import java.util.Map;
+import java.util.NoSuchElementException;
 
 import static org.junit.jupiter.api.Assertions.*;
 
@@ -143,6 +144,29 @@ public void testIteratorSkipsInternal() {
         assertEquals(2, seen);
     }
 
+    /**
+     * Verifies the Attributes iterator contract at exhaustion: after every attribute has been
+     * consumed, hasNext() reports false and a further next() throws NoSuchElementException.
+     */
+    @Test void iteratorThrows() {
+        Attributes attrs = new Attributes();
+        attrs.put("One", "one").put("Two", "two");
+
+        Iterator<Attribute> it = attrs.iterator();
+        int seen = 0;
+        while (it.hasNext()) {
+            it.next();
+            seen++;
+        }
+        assertFalse(it.hasNext());
+        assertEquals(2, seen);
+
+        // the iterator is exhausted, so next() must throw rather than return a value;
+        // assertThrows fails the test if nothing is thrown, or if an unrelated exception
+        // type escapes, and reports what actually happened
+        assertThrows(NoSuchElementException.class, it::next);
+    }
+
     @Test
     public void testListSkipsInternal() {
         Attributes a = new Attributes();
diff --git a/src/test/java/org/jsoup/nodes/ElementTest.java b/src/test/java/org/jsoup/nodes/ElementTest.java
index bba0940fc1..12a51a653f 100644
--- a/src/test/java/org/jsoup/nodes/ElementTest.java
+++ b/src/test/java/org/jsoup/nodes/ElementTest.java
@@ -208,6 +208,18 @@ public void testWholeText() {
         assertEquals("Hello  \n  there", doc.wholeText());
     }
 
+    @Test void wholeTextRuns() {
+        // wholeText() must hand back the text exactly as parsed: nothing trimmed, nothing collapsed
+        Document parsed = Jsoup.parse("<div><p id=1></p><p id=2> </p><p id=3>.  </p>");
+        Element empty = parsed.expectFirst("#1");
+        Element singleSpace = parsed.expectFirst("#2");
+        Element trailingSpaces = parsed.expectFirst("#3");
+        // an empty element, a whitespace-only element, and text followed by two spaces
+        assertEquals("", empty.wholeText());
+        assertEquals(" ", singleSpace.wholeText());
+        assertEquals(".  ", trailingSpaces.wholeText());
+    }
+
     @Test
     public void testGetSiblings() {
         Document doc = Jsoup.parse("<div><p>Hello<p id=1>there<p>this<p>is<p>an<p id=last>element</div>");
@@ -2733,6 +2745,28 @@ void prettySerializationRoundTrips(Document.OutputSettings settings) {
         assertEquals("Hello", parse.data());
     }
 
+    @Test void datanodesOutputCdataInXhtml() { // script/style data is written raw in HTML syntax, CDATA-wrapped in XML syntax
+        String html = "<p><script>1 && 2</script><style>3 && 4</style> 5 &amp;&amp; 6</p>";
+        Document doc = Jsoup.parse(html); // parsed as HTML
+        String out = TextUtil.normalizeSpaces(doc.body().html());
+        assertEquals(html, out); // HTML syntax: data nodes come out verbatim, only the text node is escaped
+        Element scriptEl = doc.expectFirst("script");
+        DataNode scriptDataNode = (DataNode) scriptEl.childNode(0);
+        assertEquals("1 && 2", scriptDataNode.getWholeData());
+
+        doc.outputSettings().syntax(Document.OutputSettings.Syntax.xml);
+        String xml = doc.body().html();
+        assertEquals(
+            "<p><script><![CDATA[1 && 2]]></script><style><![CDATA[3 && 4]]></style> 5 &amp;&amp; 6</p>",
+            TextUtil.normalizeSpaces(xml));
+
+        Document xmlDoc = Jsoup.parse(xml, Parser.xmlParser()); // round-trip the XML output through the XML parser
+        assertEquals(xml, xmlDoc.html());
+        Element scriptXmlEl = xmlDoc.expectFirst("script");
+        CDataNode scriptCdata = (CDataNode) scriptXmlEl.childNode(0);
+        assertEquals(scriptDataNode.getWholeData(), scriptCdata.text()); // expected (original script data) first, actual (re-parsed CDATA) second
+    }
+
     @Test void outerHtmlAppendable() {
         // tests not string builder flow
         Document doc = Jsoup.parse("<div>One</div>");
@@ -2816,4 +2850,19 @@ void prettySerializationRoundTrips(Document.OutputSettings settings) {
 
         assertEquals("<p>One</p>", header.html());
     }
+
+    @Test void xmlSyntaxSetsEscapeMode() { // selecting XML output syntax also changes how entities are escaped
+        String html = "Foo&nbsp;&Succeeds;";
+        Document doc = Jsoup.parse(html);
+        doc.outputSettings().charset("ascii"); // ascii cannot encode the nbsp or U+227B, so both are written as escapes we can assert on
+        assertEquals("Foo&nbsp;&#x227b;", doc.body().html());
+
+        doc.outputSettings().syntax(Document.OutputSettings.Syntax.xml);
+        String out = doc.body().html();
+        assertEquals("Foo&#xa0;&#x227b;", out); // the nbsp is now a numeric reference instead of the named &nbsp;
+
+        // can set back if desired
+        doc.outputSettings().escapeMode(Entities.EscapeMode.extended);
+        assertEquals("Foo&nbsp;&succ;", doc.body().html()); // succ is alias for Succeeds, and first hit in entities
+    }
 }
diff --git a/src/test/java/org/jsoup/nodes/NodeIteratorTest.java b/src/test/java/org/jsoup/nodes/NodeIteratorTest.java
new file mode 100644
index 0000000000..ab7e9345e5
--- /dev/null
+++ b/src/test/java/org/jsoup/nodes/NodeIteratorTest.java
@@ -0,0 +1,266 @@
+package org.jsoup.nodes;
+
+import org.jsoup.Jsoup;
+import org.junit.jupiter.api.Test;
+
+import java.util.NoSuchElementException;
+
+import static org.junit.jupiter.api.Assertions.*;
+
+class NodeIteratorTest {
+    String html = "<div id=1><p>One<p>Two</div><div id=2><p>Three<p>Four</div>";
+
+    /**
+     * Walks the whole document and checks the visiting order (parents before children, in
+     * document order, starting at the Document node), then checks behaviour at exhaustion.
+     */
+    @Test void canIterateNodes() {
+        Document doc = Jsoup.parse(html);
+        NodeIterator<Node> it = NodeIterator.from(doc);
+        assertIterates(it, "#root;html;head;body;div#1;p;One;p;Two;div#2;p;Three;p;Four;");
+        // todo - need to review that the Document object #root holds the html element as child. Why not have document root == html element?
+        assertFalse(it.hasNext());
+
+        // once exhausted, next() must follow the java.util.Iterator contract and throw;
+        // assertThrows fails the test if nothing is thrown
+        assertThrows(NoSuchElementException.class, it::next);
+    }
+
+    @Test void hasNextIsPure() {
+        // asking hasNext() repeatedly must not advance the cursor or swallow the first node
+        NodeIterator<Node> nodes = NodeIterator.from(Jsoup.parse(html));
+        assertTrue(nodes.hasNext());
+        assertTrue(nodes.hasNext());
+        assertIterates(nodes, "#root;html;head;body;div#1;p;One;p;Two;div#2;p;Three;p;Four;");
+        assertFalse(nodes.hasNext());
+    }
+
+    @Test void iterateSubTree() {
+        // an iterator opened on an element stays inside that element's subtree
+        // and never runs on into the following sibling
+        Document doc = Jsoup.parse(html);
+
+        NodeIterator<Node> first = NodeIterator.from(doc.expectFirst("div#1"));
+        assertIterates(first, "div#1;p;One;p;Two;");
+        assertFalse(first.hasNext());
+
+        NodeIterator<Node> second = NodeIterator.from(doc.expectFirst("div#2"));
+        assertIterates(second, "div#2;p;Three;p;Four;");
+        assertFalse(second.hasNext());
+    }
+
+    @Test void canRestart() {
+        // restart(node) points an already-drained iterator at a new root, here the second div
+        Document doc = Jsoup.parse(html);
+        NodeIterator<Node> walker = NodeIterator.from(doc);
+        assertIterates(walker, "#root;html;head;body;div#1;p;One;p;Two;div#2;p;Three;p;Four;");
+        Element secondDiv = doc.expectFirst("div#2");
+        walker.restart(secondDiv);
+        assertIterates(walker, "div#2;p;Three;p;Four;");
+    }
+
+    @Test void canIterateJustOneSibling() {
+        // the "Two" paragraph is a last child; a walk from it must not climb out towards div#2
+        Document doc = Jsoup.parse(html);
+        Element target = doc.expectFirst("p:contains(Two)");
+        assertEquals("Two", target.text());
+
+        assertIterates(NodeIterator.from(target), "p;Two;");
+
+        // filtered to Element: only the p itself qualifies, its text node is skipped
+        NodeIterator<Element> elementsOnly = new NodeIterator<>(target, Element.class);
+        assertSame(target, elementsOnly.next());
+        assertFalse(elementsOnly.hasNext());
+    }
+
+    @Test void canIterateFirstEmptySibling() {
+        // a childless first sibling yields just itself; the walk must not spill into p#2 or p#3
+        Document doc = Jsoup.parse("<div><p id=1></p><p id=2>.</p><p id=3>..</p>");
+        Element emptyP = doc.expectFirst("p#1");
+        assertEquals("", emptyP.ownText());
+
+        NodeIterator<Node> walker = NodeIterator.from(emptyP);
+        assertTrue(walker.hasNext());
+        assertSame(emptyP, walker.next());
+        assertFalse(walker.hasNext());
+    }
+
+    @Test void canRemoveViaIterator() { // it.remove() takes the just-returned node, and with it its subtree, out of the document
+        String html = "<div id=out1><div id=1><p>One<p>Two</div><div id=2><p>Three<p>Four</div></div><div id=out2>Out2";
+        Document doc = Jsoup.parse(html);
+
+        NodeIterator<Node> it = NodeIterator.from(doc);
+        StringBuilder seen = new StringBuilder();
+        while (it.hasNext()) {
+            Node node = it.next();
+            if (node.attr("id").equals("1"))
+                it.remove();
+            trackSeen(node, seen); // recorded after the removal, so the removed node itself still shows up in seen
+        }
+        assertEquals("#root;html;head;body;div#out1;div#1;div#2;p;Three;p;Four;div#out2;Out2;", seen.toString()); // div#1's children are never visited
+        assertContents(doc, "#root;html;head;body;div#out1;div#2;p;Three;p;Four;div#out2;Out2;");
+
+        it = NodeIterator.from(doc); // second pass: remove div#2, by now the only child left in div#out1
+        seen = new StringBuilder();
+        while (it.hasNext()) {
+            Node node = it.next();
+            if (node.attr("id").equals("2"))
+                it.remove();
+            trackSeen(node, seen);
+        }
+        assertEquals("#root;html;head;body;div#out1;div#2;div#out2;Out2;", seen.toString()); // the walk carries on at div#out2
+        assertContents(doc, "#root;html;head;body;div#out1;div#out2;Out2;");
+    }
+
+    @Test void canRemoveViaNode() { // same scenario as removal through the iterator, but calling Node.remove() directly mid-walk
+        String html = "<div id=out1><div id=1><p>One<p>Two</div><div id=2><p>Three<p>Four</div></div><div id=out2>Out2";
+        Document doc = Jsoup.parse(html);
+
+        NodeIterator<Node> it = NodeIterator.from(doc);
+        StringBuilder seen = new StringBuilder();
+        while (it.hasNext()) {
+            Node node = it.next();
+            if (node.attr("id").equals("1"))
+                node.remove(); // the iterator is not told about this; it has to cope with its current node being detached
+            trackSeen(node, seen);
+        }
+        assertEquals("#root;html;head;body;div#out1;div#1;div#2;p;Three;p;Four;div#out2;Out2;", seen.toString()); // div#1's children are never visited
+        assertContents(doc, "#root;html;head;body;div#out1;div#2;p;Three;p;Four;div#out2;Out2;");
+
+        it = NodeIterator.from(doc); // second pass: remove div#2, by now the only child left in div#out1
+        seen = new StringBuilder();
+        while (it.hasNext()) {
+            Node node = it.next();
+            if (node.attr("id").equals("2"))
+                node.remove();
+            trackSeen(node, seen);
+        }
+        assertEquals("#root;html;head;body;div#out1;div#2;div#out2;Out2;", seen.toString()); // the walk carries on at div#out2
+        assertContents(doc, "#root;html;head;body;div#out1;div#out2;Out2;");
+    }
+
+    @Test void canReplace() { // replacing the current node mid-walk: the iterator continues into the replacement
+        String html = "<div id=out1><div id=1><p>One<p>Two</div><div id=2><p>Three<p>Four</div></div><div id=out2>Out2";
+        Document doc = Jsoup.parse(html);
+
+        NodeIterator<Node> it = NodeIterator.from(doc);
+        StringBuilder seen = new StringBuilder();
+        while (it.hasNext()) {
+            Node node = it.next();
+            trackSeen(node, seen); // recorded before the swap, so div#1 is in seen even though it leaves the document
+            if (node.attr("id").equals("1")) {
+                node.replaceWith(new Element("span").text("Foo"));
+            }
+        }
+        assertEquals("#root;html;head;body;div#out1;div#1;span;Foo;div#2;p;Three;p;Four;div#out2;Out2;", seen.toString());
+        // ^^ we don't see <p>One, do see the replaced in <span>, and the subsequent nodes
+        assertContents(doc, "#root;html;head;body;div#out1;span;Foo;div#2;p;Three;p;Four;div#out2;Out2;");
+
+        it = NodeIterator.from(doc); // second pass: replace div#2, the last child of div#out1
+        seen = new StringBuilder();
+        while (it.hasNext()) {
+            Node node = it.next();
+            trackSeen(node, seen);
+            if (node.attr("id").equals("2")) {
+                node.replaceWith(new Element("span").text("Bar"));
+            }
+        }
+        assertEquals("#root;html;head;body;div#out1;span;Foo;div#2;span;Bar;div#out2;Out2;", seen.toString());
+        assertContents(doc, "#root;html;head;body;div#out1;span;Foo;span;Bar;div#out2;Out2;");
+    }
+
+    @Test void canWrap() {
+        // wrapping the current node mid-walk must not derail the iterator: its descendants are still visited
+        Document doc = Jsoup.parse(html);
+        boolean reachedInnerText = false;
+        for (NodeIterator<Node> walker = NodeIterator.from(doc); walker.hasNext(); ) {
+            Node current = walker.next();
+            if ("1".equals(current.attr("id")))
+                current.wrap("<div id=outer>");
+            boolean isOneText = current instanceof TextNode && "One".equals(((TextNode) current).text());
+            reachedInnerText = reachedInnerText || isOneText;
+        }
+
+        assertContents(doc, "#root;html;head;body;div#outer;div#1;p;One;p;Two;div#2;p;Three;p;Four;");
+        assertTrue(reachedInnerText);
+    }
+
+    @Test void canFilterForElements() {
+        // typed to Element.class, the iterator hands back elements only; text nodes are skipped
+        Document doc = Jsoup.parse(html);
+        StringBuilder visited = new StringBuilder();
+
+        NodeIterator<Element> elements = new NodeIterator<>(doc, Element.class);
+        while (elements.hasNext()) {
+            Element next = elements.next();
+            assertNotNull(next);
+            trackSeen(next, visited);
+        }
+        assertEquals("#root;html;head;body;div#1;p;p;div#2;p;p;", visited.toString());
+    }
+
+    @Test void canFilterForTextNodes() {
+        // typed to TextNode.class, only the four text nodes come back, in document order
+        Document doc = Jsoup.parse(html);
+        StringBuilder visited = new StringBuilder();
+
+        NodeIterator<TextNode> texts = new NodeIterator<>(doc, TextNode.class);
+        while (texts.hasNext()) {
+            TextNode next = texts.next();
+            assertNotNull(next);
+            trackSeen(next, visited);
+        }
+        assertEquals("One;Two;Three;Four;", visited.toString());
+        assertContents(doc, "#root;html;head;body;div#1;p;One;p;Two;div#2;p;Three;p;Four;"); // filtering leaves the tree as it was
+    }
+
+    @Test void canModifyFilteredElements() {
+        // el.text(..) rewrites an element's text while the walk is in progress;
+        // the element-only iterator must carry on and still report every element
+        Document doc = Jsoup.parse(html);
+        StringBuilder visited = new StringBuilder();
+        for (NodeIterator<Element> elements = new NodeIterator<>(doc, Element.class); elements.hasNext(); ) {
+            Element current = elements.next();
+            String own = current.ownText();
+            if (!own.isEmpty())
+                current.text(own + "++");
+            trackSeen(current, visited);
+        }
+        assertEquals("#root;html;head;body;div#1;p;p;div#2;p;p;", visited.toString());
+        assertContents(doc, "#root;html;head;body;div#1;p;One++;p;Two++;div#2;p;Three++;p;Four++;");
+    }
+
+    /** Drains {@code it}, checking each node is non-null and differs from the one before, then compares the trail to {@code expected}. */
+    static <T extends Node> void assertIterates(NodeIterator<T> it, String expected) {
+        StringBuilder trail = new StringBuilder();
+        for (Node last = null; it.hasNext(); ) {
+            Node current = it.next();
+            assertNotNull(current);
+            assertNotSame(last, current); // catches an iterator that returns the same node twice in a row
+
+            trackSeen(current, trail);
+            last = current;
+        }
+        assertEquals(expected, trail.toString());
+    }
+
+    static void assertContents(Element el, String expected) {
+        // walk el and everything beneath it with a fresh iterator, and compare against the expected trail
+        assertIterates(NodeIterator.from(el), expected);
+    }
+
+    /** Appends one ';'-terminated token for node: tag name (plus #id if set), a text node's text, else the node name. */
+    static void trackSeen(Node node, StringBuilder actual) {
+        String token;
+        if (node instanceof TextNode) {
+            token = ((TextNode) node).text();
+        } else if (node instanceof Element) {
+            Element element = (Element) node;
+            token = element.hasAttr("id") ? element.tagName() + "#" + element.id() : element.tagName();
+        } else {
+            token = node.nodeName();
+        }
+        actual.append(token).append(";");
+    }
+
+}
\ No newline at end of file
diff --git a/src/test/java/org/jsoup/nodes/NodeStreamTest.java b/src/test/java/org/jsoup/nodes/NodeStreamTest.java
new file mode 100644
index 0000000000..b8aadaf83f
--- /dev/null
+++ b/src/test/java/org/jsoup/nodes/NodeStreamTest.java
@@ -0,0 +1,70 @@
+package org.jsoup.nodes;
+
+import org.jsoup.Jsoup;
+import org.junit.jupiter.api.Test;
+
+import java.util.Optional;
+import java.util.stream.Stream;
+
+import static org.jsoup.nodes.NodeIteratorTest.trackSeen;
+import static org.jsoup.nodes.NodeIteratorTest.assertContents;
+import static org.junit.jupiter.api.Assertions.*;
+
+public class NodeStreamTest {
+
+    String html = "<div id=1><p>One<p>Two</div><div id=2><p>Three<p>Four</div>";
+
+
+    @Test void canStream() {
+        // nodeStream() yields every node, the Document first, in document order
+        StringBuilder visited = new StringBuilder();
+        Stream<Node> nodes = Jsoup.parse(html).nodeStream();
+        nodes.forEachOrdered(node -> trackSeen(node, visited));
+        assertEquals("#root;html;head;body;div#1;p;One;p;Two;div#2;p;Three;p;Four;", visited.toString());
+    }
+
+    @Test void canStreamParallel() {
+        // 14 = #root, html, head, body + 2 divs + 4 p + 4 text nodes; going parallel must not lose or repeat any
+        long total = Jsoup.parse(html).nodeStream().parallel().count();
+        assertEquals(14, total);
+    }
+
+    @Test void canFindFirst() { // the stream's first node is the one it was opened on, here the Document
+        Document parsed = Jsoup.parse(html);
+        Optional<Node> head = parsed.nodeStream().findFirst();
+        assertTrue(head.isPresent());
+        assertSame(parsed, head.get());
+    }
+
+    @Test void canFilter() {
+        // ordinary Stream filtering works on the node stream: keep only the text nodes
+        Document doc = Jsoup.parse(html);
+        StringBuilder seen = new StringBuilder();
+        doc.nodeStream()
+            .filter(node -> node instanceof TextNode)
+            .forEachOrdered(node -> trackSeen(node, seen)); // the assertion depends on encounter order, which plain forEach does not promise
+
+        assertEquals("One;Two;Three;Four;", seen.toString());
+    }
+
+    @Test void canRemove() {
+        // nodes can be detached from inside the stream pipeline: divs 1 and 2 go, div 3 stays
+        Document doc = Jsoup.parse("<div id=1><p>One<p>Two</div><div id=2><p>Three<p>Four</div><div id=3><p>Five");
+
+        doc.nodeStream()
+            .filter(node -> node instanceof Element)
+            .filter(node -> "1".equals(node.attr("id")) || "2".equals(node.attr("id")))
+            .forEach(Node::remove);
+
+        assertContents(doc, "#root;html;head;body;div#3;p;Five;");
+    }
+
+    @Test void elementStream() {
+        // stream() is the element-only counterpart of nodeStream(): the text nodes are left out
+        StringBuilder visited = new StringBuilder();
+        Stream<Element> elements = Jsoup.parse(html).stream();
+        elements.forEachOrdered(el -> trackSeen(el, visited));
+        assertEquals("#root;html;head;body;div#1;p;p;div#2;p;p;", visited.toString());
+    }
+
+}
diff --git a/src/test/java/org/jsoup/nodes/PositionTest.java b/src/test/java/org/jsoup/nodes/PositionTest.java
index 1db73c9e97..ee6f49d79f 100644
--- a/src/test/java/org/jsoup/nodes/PositionTest.java
+++ b/src/test/java/org/jsoup/nodes/PositionTest.java
@@ -4,12 +4,11 @@
 import org.jsoup.integration.servlets.FileServlet;
 import org.jsoup.parser.Parser;
 import org.jsoup.select.Elements;
-import org.jsoup.select.NodeTraversor;
 import org.junit.jupiter.api.Test;
 
 import java.io.IOException;
-import java.util.ArrayList;
 import java.util.List;
+import java.util.stream.Collectors;
 
 import static org.junit.jupiter.api.Assertions.*;
 
@@ -32,9 +31,10 @@ class PositionTest {
     }
 
     @Test void tracksPosition() {
-        String html = "<p id=1\n class=foo>\n<span>Hello\n &reg;\n there &copy.</span> now.\n <!-- comment --> ";
-        Document doc = Jsoup.parse(html, TrackingParser);
+        String content = "<p id=1\n class=foo>\n<span>Hello\n &reg;\n there &copy.</span> now.\n <!-- comment --> ";
+        Document doc = Jsoup.parse(content, TrackingParser);
 
+        Element html = doc.expectFirst("html");
         Element body = doc.expectFirst("body");
         Element p = doc.expectFirst("p");
         Element span = doc.expectFirst("span");
@@ -45,14 +45,28 @@ class PositionTest {
         Comment comment = (Comment) now.nextSibling();
         assertNotNull(comment);
 
-        assertFalse(body.sourceRange().isTracked());
+        // implicit
+        assertTrue(body.sourceRange().isTracked());
+        assertTrue(body.endSourceRange().isTracked());
+        assertTrue(body.sourceRange().isImplicit());
+        assertTrue(body.endSourceRange().isImplicit());
+        Range htmlRange = html.sourceRange();
+        assertEquals("1,1:0-1,1:0", htmlRange.toString());
+        assertEquals(htmlRange, body.sourceRange());
+        assertEquals(html.endSourceRange(), body.endSourceRange());
+
 
         Range pRange = p.sourceRange();
         assertEquals("1,1:0-2,12:19", pRange.toString());
+        assertFalse(pRange.isImplicit());
+        assertTrue(p.endSourceRange().isImplicit());
+        assertEquals("6,19:83-6,19:83", p.endSourceRange().toString());
+        assertEquals(p.endSourceRange(), html.endSourceRange());
 
         // no explicit P closer
         Range pEndRange = p.endSourceRange();
-        assertFalse(pEndRange.isTracked());
+        assertTrue(pEndRange.isTracked());
+        assertTrue(pEndRange.isImplicit());
 
         Range.Position pStart = pRange.start();
         assertTrue(pStart.isTracked());
@@ -88,6 +102,76 @@ class PositionTest {
         assertEquals("6,18:82", comment.sourceRange().end().toString());
     }
 
+    @Test void tracksExpectedPoppedElements() {
+        // When TreeBuilder hits a direct .pop(), vs popToClose(..); every tag is explicit here, so no range may be implicit
+        String html = "<html><head><meta></head><body><img><p>One</p><p>Two</p></body></html>";
+        Document doc = Jsoup.parse(html, TrackingParser);
+        StringBuilder elementTrack = new StringBuilder();
+        doc.expectFirst("html").stream().forEach(element -> {
+            String tag = element.tagName(); // passed as the failure message, to name the offending element
+            accumulatePositions(element, elementTrack);
+            assertTrue(element.sourceRange().isTracked(), tag);
+            assertTrue(element.endSourceRange().isTracked(), tag);
+            assertFalse(element.sourceRange().isImplicit(), tag);
+            assertFalse(element.endSourceRange().isImplicit(), tag);
+        });
+        assertEquals("html:0-6~63-70; head:6-12~18-25; meta:12-18~12-18; body:25-31~56-63; img:31-36~31-36; p:36-39~42-46; p:46-49~52-56; ", elementTrack.toString());
+
+        StringBuilder textTrack = new StringBuilder();
+        doc.nodeStream(TextNode.class).forEach(text -> accumulatePositions(text, textTrack));
+        assertEquals("#text:39-42; #text:49-52; ", textTrack.toString());
+    }
+
+    /**
+     * Appends {@code name:start-end} for the node's source range to sb, followed by "; ".
+     * For an Element the end source range is added as well, as {@code ~start-end}.
+     */
+    static void accumulatePositions(Node node, StringBuilder sb) {
+        Range open = node.sourceRange();
+        sb.append(node.nodeName())
+            .append(':').append(open.startPos())
+            .append('-').append(open.endPos());
+
+        if (node instanceof Element) {
+            Range close = ((Element) node).endSourceRange();
+            sb.append("~").append(close.startPos())
+                .append('-').append(close.endPos());
+        }
+
+        sb.append("; ");
+    }
+
+    @Test void tracksImplicitPoppedElements() {
+        // When TreeBuilder hits a direct .pop(), vs popToClose(..)
+        // the input has no html/head/body tags and no </p>: those ranges come out zero-width (start == end)
+        String html = "<meta><img><p>One<p>Two<p>Three";
+        Document doc = Jsoup.parse(html, TrackingParser);
+        StringBuilder positions = new StringBuilder();
+        doc.expectFirst("html").stream().forEach(element -> {
+            assertTrue(element.sourceRange().isTracked());
+            assertTrue(element.endSourceRange().isTracked());
+            accumulatePositions(element, positions);
+        });
+
+        assertTrue(doc.expectFirst("p").endSourceRange().isImplicit());
+        assertFalse(doc.expectFirst("meta").endSourceRange().isImplicit());
+        assertEquals("html:0-0~31-31; head:0-0~6-6; meta:0-6~0-6; body:6-6~31-31; img:6-11~6-11; p:11-14~17-17; p:17-20~23-23; p:23-26~31-31; ", positions.toString());
+    }
+    private void printRange(Node node) { // debugging aid: prints a node's source positions to stdout. NOTE(review): nothing in this change calls it; confirm it is still wanted
+        if (node instanceof Element) {
+            Element el = (Element) node;
+            System.out.println(el.tagName() + "\t"
+                + el.sourceRange().start().pos() + "-" + el.sourceRange().end().pos()
+                + "\t... "
+                + el.endSourceRange().start().pos() + "-" + el.endSourceRange().end().pos() // end source range, elements only
+            );
+        } else {
+            System.out.println(node.nodeName() + "\t"
+                + node.sourceRange().start().pos() + "-" + node.sourceRange().end().pos()
+            );
+        }
+    }
+
     @Test void tracksMarkup() {
         String html = "<!doctype\nhtml>\n<title>jsoup &copy;\n2022</title><body>\n<![CDATA[\n<jsoup>\n]]>";
         Document doc = Jsoup.parse(html, TrackingParser);
@@ -177,19 +261,19 @@ class PositionTest {
         String html = "<table>foo<tr>bar<td>baz</td>qux</tr>coo</table>";
         Document doc = Jsoup.parse(html, TrackingParser);
 
-        List<TextNode> textNodes = new ArrayList<>();
-        NodeTraversor.traverse((Node node, int depth) -> {
-            if (node instanceof TextNode) {
-                textNodes.add((TextNode) node);
-            }
-        }, doc);
+        StringBuilder track = new StringBuilder();
+        List<TextNode> textNodes = doc.nodeStream(TextNode.class)
+            .peek(node -> accumulatePositions(node, track))
+            .collect(Collectors.toList());
 
         assertEquals(5, textNodes.size());
-        assertEquals("1,8:7-1,11:10", textNodes.get(0).sourceRange().toString());
-        assertEquals("1,15:14-1,18:17", textNodes.get(1).sourceRange().toString());
-        assertEquals("1,22:21-1,25:24", textNodes.get(2).sourceRange().toString());
-        assertEquals("1,30:29-1,33:32", textNodes.get(3).sourceRange().toString());
-        assertEquals("1,38:37-1,41:40", textNodes.get(4).sourceRange().toString());
+        assertEquals("foo", textNodes.get(0).text());
+        assertEquals("bar", textNodes.get(1).text());
+        assertEquals("baz", textNodes.get(2).text());
+        assertEquals("qux", textNodes.get(3).text());
+        assertEquals("coo", textNodes.get(4).text());
+
+        assertEquals("#text:7-10; #text:14-17; #text:21-24; #text:29-32; #text:37-40; ", track.toString());
     }
 
     @Test void tracksClosingHtmlTagsInXml() {
@@ -219,4 +303,76 @@ class PositionTest {
         assertEquals("1,20:19-1,25:24", h2.endSourceRange().toString());
     }
 
+    @Test void tracksAttributes() {
+        // covers double-quoted, unquoted, spaced '=', single-quoted, empty-string and valueless attributes
+        String html = "<div one=\"Hello there\" id=1 class=foo attr1 = \"bar &amp; qux\" attr2='val &gt x' attr3=\"\" attr4 attr5>Text";
+        Document doc = Jsoup.parse(html, TrackingParser);
+
+        Element div = doc.expectFirst("div");
+
+        StringBuilder track = new StringBuilder();
+        for (Attribute attr : div.attributes()) {
+            Range.AttributeRange attrRange = attr.sourceRange();
+            assertTrue(attrRange.nameRange().isTracked());
+            assertTrue(attrRange.valueRange().isTracked());
+            assertSame(attrRange, div.attributes().sourceRange(attr.getKey()));
+
+            assertFalse(attrRange.nameRange().isImplicit());
+            if (attr.getValue().isEmpty())
+                assertTrue(attrRange.valueRange().isImplicit());
+            else
+                assertFalse(attrRange.valueRange().isImplicit());
+
+            accumulatePositions(attr, track);
+        }
+
+        // format is name:start-end=valueStart-valueEnd; an empty value has a zero-width value range
+        assertEquals("one:5-8=10-21; id:23-25=26-27; class:28-33=34-37; attr1:38-43=47-60; attr2:62-67=69-78; attr3:80-85=85-85; attr4:89-94=94-94; attr5:95-100=100-100; ", track.toString());
+    }
+
+    @Test void tracksAttributesAcrossLines() {
+        // the attributes are spread over six source lines; pos offsets run on across the line breaks
+        String html = "<div one=\"Hello\nthere\" \nid=1 \nclass=\nfoo\nattr5>Text";
+        Document doc = Jsoup.parse(html, TrackingParser);
+
+        Element div = doc.expectFirst("div");
+
+        StringBuilder positions = new StringBuilder();
+        for (Attribute attribute : div.attributes()) {
+            Range.AttributeRange tracked = attribute.sourceRange();
+            assertTrue(tracked.nameRange().isTracked());
+            assertTrue(tracked.valueRange().isTracked());
+            assertSame(tracked, div.attributes().sourceRange(attribute.getKey()));
+            assertFalse(tracked.nameRange().isImplicit());
+            // a value range is implicit exactly when the attribute has no value text
+            boolean valueless = attribute.getValue().isEmpty();
+            assertEquals(valueless, tracked.valueRange().isImplicit());
+            accumulatePositions(attribute, positions);
+        }
+
+        // class sits on line 4 and its value foo on line 5; toString() gives line,column:pos for each end
+        Range.AttributeRange classRange = div.attributes().sourceRange("class");
+        assertEquals("foo", div.attributes().get("class"));
+        assertEquals("4,1:30-4,6:35=5,1:37-5,4:40", classRange.toString());
+
+        assertEquals("one:5-8=10-21; id:24-26=27-28; class:30-35=37-40; attr5:41-46=46-46; ", positions.toString());
+    }
+
+    /**
+     * Appends {@code key:nameStart-nameEnd=valueStart-valueEnd} for the attribute's source
+     * range to sb, followed by "; ".
+     */
+    static void accumulatePositions(Attribute attr, StringBuilder sb) {
+        Range.AttributeRange range = attr.sourceRange();
+        Range name = range.nameRange();
+        Range value = range.valueRange();
+
+        sb.append(attr.getKey())
+            .append(':').append(name.startPos())
+            .append('-').append(name.endPos())
+            .append('=').append(value.startPos())
+            .append('-').append(value.endPos());
+
+        sb.append("; ");
+    }
 }
\ No newline at end of file
diff --git a/src/test/java/org/jsoup/parser/CharacterReaderTest.java b/src/test/java/org/jsoup/parser/CharacterReaderTest.java
index 5aa9a58e74..7071bfe51d 100644
--- a/src/test/java/org/jsoup/parser/CharacterReaderTest.java
+++ b/src/test/java/org/jsoup/parser/CharacterReaderTest.java
@@ -433,14 +433,14 @@ public void notEmptyAtBufferSplitPoint() {
         assertEquals(12, noTrack.pos());
         assertEquals(1, noTrack.lineNumber());
         assertEquals(13, noTrack.columnNumber());
-        assertEquals("1:13", noTrack.cursorPos());
+        assertEquals("1:13", noTrack.posLineCol());
         // get over the buffer
         while (!noTrack.matches("[foo]"))
             noTrack.consumeTo("[foo]");
         assertEquals(32778, noTrack.pos());
         assertEquals(1, noTrack.lineNumber());
         assertEquals(noTrack.pos()+1, noTrack.columnNumber());
-        assertEquals("1:32779", noTrack.cursorPos());
+        assertEquals("1:32779", noTrack.posLineCol());
 
         // and the line numbers: "<foo>\n<bar>\n<qux>\n"
         assertEquals(0, track.pos());
@@ -462,24 +462,24 @@ public void notEmptyAtBufferSplitPoint() {
         assertEquals(12, track.pos());
         assertEquals(3, track.lineNumber());
         assertEquals(1, track.columnNumber());
-        assertEquals("3:1", track.cursorPos());
+        assertEquals("3:1", track.posLineCol());
         assertEquals("<qux>", track.consumeTo('\n'));
-        assertEquals("3:6", track.cursorPos());
+        assertEquals("3:6", track.posLineCol());
         // get over the buffer
         while (!track.matches("[foo]"))
             track.consumeTo("[foo]");
         assertEquals(32778, track.pos());
         assertEquals(4, track.lineNumber());
         assertEquals(32761, track.columnNumber());
-        assertEquals("4:32761", track.cursorPos());
+        assertEquals("4:32761", track.posLineCol());
         track.consumeTo('\n');
-        assertEquals("4:32766", track.cursorPos());
+        assertEquals("4:32766", track.posLineCol());
 
         track.consumeTo("[bar]");
         assertEquals(5, track.lineNumber());
-        assertEquals("5:1", track.cursorPos());
+        assertEquals("5:1", track.posLineCol());
         track.consumeToEnd();
-        assertEquals("5:6", track.cursorPos());
+        assertEquals("5:6", track.posLineCol());
     }
 
     @Test public void countsColumnsOverBufferWhenNoNewlines() {
@@ -490,7 +490,7 @@ public void notEmptyAtBufferSplitPoint() {
         CharacterReader reader = new CharacterReader(content);
         reader.trackNewlines(true);
 
-        assertEquals("1:1", reader.cursorPos());
+        assertEquals("1:1", reader.posLineCol());
         while (!reader.isEmpty())
             reader.consume();
         assertEquals(131096, reader.pos());
@@ -515,4 +515,32 @@ public void notEmptyAtBufferSplitPoint() {
         assertEquals(14, reader.columnNumber());
     }
 
+    @Test public void consumeDoubleQuotedAttributeConsumesThruSingleQuote() {
+        // double-quoted read (argument false): an embedded ' is ordinary data, the read stops at the "
+        CharacterReader reader = new CharacterReader("He'llo\" >");
+        assertEquals("He'llo", reader.consumeAttributeQuoted(false));
+        assertEquals('"', reader.consume()); // the quote itself was left unconsumed
+    }
+
+    @Test public void consumeSingleQuotedAttributeConsumesThruDoubleQuote() {
+        // single-quoted read (argument true): an embedded " is ordinary data, the read stops at the '
+        CharacterReader reader = new CharacterReader("He\"llo' >");
+        assertEquals("He\"llo", reader.consumeAttributeQuoted(true));
+        assertEquals('\'', reader.consume()); // the quote itself was left unconsumed
+    }
+
+    @Test public void consumeDoubleQuotedAttributeConsumesThruSingleQuoteToAmp() {
+        // double-quoted read (argument false): passes over the ' but stops at the first &
+        CharacterReader reader = new CharacterReader("He'llo &copy;\" >");
+        assertEquals("He'llo ", reader.consumeAttributeQuoted(false));
+        assertEquals('&', reader.consume()); // the ampersand is the next char to be read
+    }
+
+    @Test public void consumeSingleQuotedAttributeConsumesThruDoubleQuoteToAmp() {
+        // single-quoted read (argument true): passes over the " but stops at the first &
+        CharacterReader reader = new CharacterReader("He\"llo &copy;' >");
+        assertEquals("He\"llo ", reader.consumeAttributeQuoted(true));
+        assertEquals('&', reader.consume()); // the ampersand is the next char to be read
+    }
+
 }
diff --git a/src/test/java/org/jsoup/parser/HtmlTreeBuilderTest.java b/src/test/java/org/jsoup/parser/HtmlTreeBuilderTest.java
index dae8e4600f..dcd41b8804 100644
--- a/src/test/java/org/jsoup/parser/HtmlTreeBuilderTest.java
+++ b/src/test/java/org/jsoup/parser/HtmlTreeBuilderTest.java
@@ -1,14 +1,11 @@
 package org.jsoup.parser;
 
 
+import org.jspecify.annotations.NullMarked;
 import org.junit.jupiter.api.Test;
-
-import javax.annotation.Nonnull;
-import javax.annotation.ParametersAreNonnullByDefault;
 import java.io.Reader;
 import java.lang.annotation.Annotation;
 import java.lang.reflect.Method;
-import java.util.Arrays;
 import java.util.List;
 
 import static org.junit.jupiter.api.Assertions.*;
@@ -31,12 +28,10 @@ public void nonnull() {
     }
 
     @Test public void nonnullAssertions() throws NoSuchMethodException {
-        Method parseMethod = TreeBuilder.class.getDeclaredMethod("parse", Reader.class, String.class, Parser.class);
-        assertNotNull(parseMethod);
-        Annotation[] declaredAnnotations = parseMethod.getDeclaredAnnotations();
+        Annotation[] declaredAnnotations = TreeBuilder.class.getPackage().getDeclaredAnnotations();
         boolean seen = false;
         for (Annotation annotation : declaredAnnotations) {
-            if (annotation.annotationType().isAssignableFrom(ParametersAreNonnullByDefault.class))
+            if (annotation.annotationType().isAssignableFrom(NullMarked.class))
                 seen = true;
         }
 
diff --git a/src/test/java/org/jsoup/safety/CleanerTest.java b/src/test/java/org/jsoup/safety/CleanerTest.java
index d7c6371cbc..961a7636c2 100644
--- a/src/test/java/org/jsoup/safety/CleanerTest.java
+++ b/src/test/java/org/jsoup/safety/CleanerTest.java
@@ -9,7 +9,10 @@
 import org.jsoup.nodes.Range;
 import org.jsoup.parser.Parser;
 import org.junit.jupiter.api.Test;
+import org.junit.jupiter.params.ParameterizedTest;
+import org.junit.jupiter.params.provider.ValueSource;
 
+import java.util.Arrays;
 import java.util.Locale;
 
 import static org.junit.jupiter.api.Assertions.*;
@@ -388,15 +391,47 @@ public void bailsIfRemovingProtocolThatsNotSet() {
     }
 
     @Test void preservesSourcePositionViaUserData() {
-        Document orig = Jsoup.parse("<script>xss</script>\n <p>Hello</p>", Parser.htmlParser().setTrackPosition(true));
+        Document orig = Jsoup.parse("<script>xss</script>\n <p id=1>Hello</p>", Parser.htmlParser().setTrackPosition(true));
         Element p = orig.expectFirst("p");
         Range origRange = p.sourceRange();
-        assertEquals("2,2:22-2,5:25", origRange.toString());
+        assertEquals("2,2:22-2,10:30", origRange.toString());
 
-        Document clean = new Cleaner(Safelist.relaxed()).clean(orig);
+        Range.AttributeRange attributeRange = p.attributes().sourceRange("id");
+        assertEquals("2,5:25-2,7:27=2,8:28-2,9:29", attributeRange.toString());
+
+        Document clean = new Cleaner(Safelist.relaxed().addAttributes("p", "id")).clean(orig);
         Element cleanP = clean.expectFirst("p");
+        assertEquals("1", cleanP.id());
         Range cleanRange = cleanP.sourceRange();
-        assertEquals(cleanRange, origRange);
-        assertEquals(clean.endSourceRange(), orig.endSourceRange());
+        assertEquals(origRange, cleanRange);
+        assertEquals(orig.endSourceRange(), clean.endSourceRange());
+        assertEquals(attributeRange, cleanP.attributes().sourceRange("id"));
     }
+
+    @ParameterizedTest @ValueSource(booleans = {true, false})
+    void cleansCaseSensitiveElements(boolean preserveCase) {
+        // https://github.com/jhy/jsoup/issues/2049
+        String html = "<svg><feMerge baseFrequency=2><feMergeNode kernelMatrix=1 /><feMergeNode><clipPath /></feMergeNode><feMergeNode />";
+        String[] tagNames = {"svg", "feMerge", "feMergeNode", "clipPath"};
+        String[] attrNames = {"kernelMatrix", "baseFrequency"};
+
+        if (!preserveCase) {
+            tagNames = Arrays.stream(tagNames).map(name -> name.toLowerCase()).toArray(String[]::new);
+            attrNames = Arrays.stream(attrNames).map(name -> name.toLowerCase()).toArray(String[]::new);
+        }
+
+        // the same mixed-case output is expected whichever case the safelist entries were declared in
+        String cleaned = Jsoup.clean(html, Safelist.none().addTags(tagNames).addAttributes(":all", attrNames));
+        String expected = "<svg>\n" +
+            " <feMerge baseFrequency=\"2\">\n" +
+            "  <feMergeNode kernelMatrix=\"1\" />\n" +
+            "  <feMergeNode>\n" +
+            "   <clipPath />\n" +
+            "  </feMergeNode>\n" +
+            "  <feMergeNode />\n" +
+            " </feMerge>\n" +
+            "</svg>";
+        assertEquals(expected, cleaned);
+    }
+
 }
diff --git a/src/test/java/org/jsoup/select/ElementsTest.java b/src/test/java/org/jsoup/select/ElementsTest.java
index d1895752e8..b5ea4ef358 100644
--- a/src/test/java/org/jsoup/select/ElementsTest.java
+++ b/src/test/java/org/jsoup/select/ElementsTest.java
@@ -11,9 +11,11 @@
 import org.jsoup.nodes.TextNode;
 import org.junit.jupiter.api.Test;
 
+import java.util.Iterator;
 import java.util.List;
 
 import static org.junit.jupiter.api.Assertions.*;
+import static org.junit.jupiter.api.Assertions.assertFalse;
 
 /**
  Tests for ElementList.
@@ -435,4 +437,166 @@ public void tail(Node node, int depth) {
         assertEquals("http://example.com/bar", absAttrs.get(1));
         assertEquals("http://example.com", absAttrs.get(2));
     }
+
+    @Test public void setElementByIndex() {
+        Document doc = Jsoup.parse("<p>One<p>Two<p>Three");
+        Element replacement = doc.createElement("p").text("New").attr("id", "new");
+        Elements paras = doc.select("p");
+        Element second = paras.get(1);
+        // set() hands back the displaced element, and the replacement lands in both the list and the DOM
+        Element displaced = paras.set(1, replacement);
+        assertSame(displaced, second);
+        assertSame(replacement, paras.get(1));
+        assertEquals("<p>One</p>\n<p id=\"new\">New</p>\n<p>Three</p>", doc.body().html());
+    }
+
+    @Test public void removeElementByIndex() {
+        Document doc = Jsoup.parse("<p>One<p>Two<p>Three");
+        Elements paras = doc.select("p");
+        Element second = paras.get(1);
+        assertTrue(paras.contains(second));
+
+        // remove(int) returns the removed element, and takes it out of the DOM as well as the list
+        Element removed = paras.remove(1);
+        assertSame(removed, second);
+        assertEquals(2, paras.size());
+        assertFalse(paras.contains(removed));
+        assertEquals("<p>One</p>\n<p>Three</p>", doc.body().html());
+    }
+
+    @Test public void removeElementByObject() {
+        Document doc = Jsoup.parse("<p>One<p>Two<p>Three");
+        Elements paras = doc.select("p");
+        Element second = paras.get(1);
+        assertTrue(paras.contains(second));
+
+        // remove(Object) reports success, and takes the element out of the DOM as well as the list
+        assertTrue(paras.remove(second));
+
+        assertEquals(2, paras.size());
+        assertFalse(paras.contains(second));
+        assertEquals("<p>One</p>\n<p>Three</p>", doc.body().html());
+    }
+
+    @Test public void removeElementObjectNoops() {
+        Document doc = Jsoup.parse("<p>One<p>Two<p>Three");
+        String htmlBefore = doc.html();
+        Element unlisted = doc.createElement("p").text("New");
+        Elements paras = doc.select("p");
+        int sizeBefore = paras.size();
+        // removing objects that are not in the list (an unlisted element, a non-Element object) changes nothing
+        assertFalse(paras.remove(unlisted));
+        assertFalse(paras.remove(unlisted.childNodes()));
+        assertEquals(sizeBefore, paras.size());
+        assertEquals(htmlBefore, doc.html());
+    }
+
+    @Test public void clear() {
+        Document doc = Jsoup.parse("<p>One</p><p>Two</p><div>Three</div>");
+        Elements paras = doc.select("p");
+        assertEquals(2, paras.size());
+
+        paras.clear();
+        assertTrue(paras.isEmpty());
+        assertTrue(doc.select("p").isEmpty()); // the cleared elements are gone from the DOM too
+    }
+
+    @Test public void removeAll() {
+        Document doc = Jsoup.parse("<p>One<p>Two<p>Three<p>Four</p><div>Div");
+        Elements paras = doc.select("p");
+        assertEquals(4, paras.size());
+        Elements middle = doc.select("p:gt(0):lt(3)"); // Two and Three
+        assertEquals(2, middle.size());
+
+        // removing a subset reports a change, shrinks the receiver, and leaves the argument list alone
+        assertTrue(paras.removeAll(middle));
+        assertEquals(2, paras.size());
+        assertEquals(2, middle.size());
+
+        // removing elements that are not in the list reports no change
+        Elements divs = doc.select("div");
+        assertEquals(1, divs.size());
+        assertFalse(paras.removeAll(divs));
+        assertEquals(2, paras.size());
+        assertEquals("<p>One</p>\n<p>Four</p>\n<div>\n Div\n</div>", doc.body().html());
+    }
+
+    @Test public void retainAll() {
+        Document doc = Jsoup.parse("<p>One<p>Two<p>Three<p>Four</p><div>Div");
+        Elements paras = doc.select("p");
+        assertEquals(4, paras.size());
+        Elements middle = doc.select("p:gt(0):lt(3)"); // Two and Three
+        assertEquals(2, middle.size());
+
+        // retaining a subset reports a change and drops the other elements from the list and the DOM
+        assertTrue(paras.retainAll(middle));
+        assertEquals(2, paras.size());
+        assertEquals(2, middle.size());
+        String retainedHtml = "<p>Two</p>\n<p>Three</p>\n<div>\n Div\n</div>";
+        assertEquals(retainedHtml, doc.body().html());
+
+        // retaining everything that is already present reports no change and leaves the DOM as it was
+        Elements parasAgain = doc.select("p");
+        assertFalse(middle.retainAll(parasAgain));
+        assertEquals(retainedHtml, doc.body().html());
+    }
+
+    @Test public void iteratorRemovesFromDom() {
+        Document doc = Jsoup.parse("<p>One<p>Two<p>Three<p>Four");
+        Elements paras = doc.select("p");
+        assertEquals(4, paras.size());
+
+        Iterator<Element> cursor = paras.iterator();
+        while (cursor.hasNext()) {
+            if (cursor.next().text().contains("Two"))
+                cursor.remove(); // expected to drop the element from the DOM as well as the list
+        }
+        assertEquals(3, paras.size());
+        assertEquals("<p>One</p>\n<p>Three</p>\n<p>Four</p>", doc.body().html());
+    }
+
+    @Test public void removeIf() {
+        Document doc = Jsoup.parse("<p>One<p>Two<p>Three<p>Four");
+        Elements paras = doc.select("p");
+        assertEquals(4, paras.size());
+        String withoutTwo = "<p>One</p>\n<p>Three</p>\n<p>Four</p>";
+        // a matching predicate reports a change and removes the element from the list and the DOM
+        assertTrue(paras.removeIf(el -> el.text().contains("Two")));
+        assertEquals(3, paras.size());
+        assertEquals(withoutTwo, doc.body().html());
+
+        assertFalse(paras.removeIf(el -> el.text().contains("Five"))); // nothing matches: no change
+        assertEquals(withoutTwo, doc.body().html());
+    }
+
+    @Test public void removeIfSupportsConcurrentRead() {
+        Document doc = Jsoup.parse("<p>One<p>Two<p>Three<p>Four");
+        Elements paras = doc.select("p");
+        assertEquals(4, paras.size());
+
+        // the predicate reads the very list being filtered; every element matches, so all are removed
+        assertTrue(paras.removeIf(paras::contains));
+        assertTrue(paras.isEmpty());
+        assertEquals("", doc.body().html());
+    }
+
+    @Test public void replaceAll() {
+        Document doc = Jsoup.parse("<p>One<p>Two<p>Three<p>Four");
+        Elements paras = doc.select("p");
+        assertEquals(4, paras.size());
+
+        // swap every paragraph for a new div that carries the same text
+        paras.replaceAll(el -> {
+            String text = el.text();
+            return doc.createElement("div").text(text);
+        });
+
+        // the list now holds the replacement divs
+        paras.forEach(el -> assertEquals("div", el.tagName()));
+
+        // and so does the DOM
+        String expectedHtml = "<div> One</div><div> Two</div><div> Three</div><div> Four</div>";
+        String bodyHtml = TextUtil.normalizeSpaces(doc.body().html());
+        assertEquals(expectedHtml, bodyHtml);
+    }
 }
diff --git a/src/test/java/org/jsoup/select/QueryParserTest.java b/src/test/java/org/jsoup/select/QueryParserTest.java
index ae2f344886..51b7c925d2 100644
--- a/src/test/java/org/jsoup/select/QueryParserTest.java
+++ b/src/test/java/org/jsoup/select/QueryParserTest.java
@@ -18,10 +18,10 @@ public class QueryParserTest {
                 "<a><li><strong>l2</strong></li></a>" +
                 "<p><strong>yes</strong></p>" +
                 "</body></html>");
-        assertEquals("l1 l2 yes", doc.body().select(">p>strong,>*>li>strong").text());
+        assertEquals("l1 yes", doc.body().select(">p>strong,>li>strong").text()); // selecting immediate from body
+        assertEquals("l2 yes", doc.select("body>p>strong,body>*>li>strong").text());
+        assertEquals("l2 yes", doc.select("body>*>li>strong,body>p>strong").text());
         assertEquals("l2 yes", doc.select("body>p>strong,body>*>li>strong").text());
-        assertEquals("yes", doc.select(">body>*>li>strong,>body>p>strong").text());
-        assertEquals("l2", doc.select(">body>p>strong,>body>*>li>strong").text());
     }
 
     @Test public void testImmediateParentRun() {
diff --git a/src/test/java/org/jsoup/select/SelectorTest.java b/src/test/java/org/jsoup/select/SelectorTest.java
index 3196dc2527..cd2f519a27 100644
--- a/src/test/java/org/jsoup/select/SelectorTest.java
+++ b/src/test/java/org/jsoup/select/SelectorTest.java
@@ -19,16 +19,31 @@
  * @author Jonathan Hedley, jonathan@hedley.net
  */
 public class SelectorTest {
+
+    /** Asserts that the selected elements have exactly the specified IDs, compared position by position.
+     A content failure reports the index that mismatched. */
+    static void assertSelectedIds(Elements els, String... ids) {
+        assertNotNull(els);
+        assertEquals(ids.length, els.size(), "Incorrect number of selected elements");
+        for (int i = 0; i < ids.length; i++)
+            assertEquals(ids[i], els.get(i).id(), "Incorrect content at index " + i);
+    }
+
+    /** Asserts that the selected elements have exactly the specified own-texts; failures report the index. */
+    static void assertSelectedOwnText(Elements els, String... ownTexts) {
+        assertNotNull(els);
+        assertEquals(ownTexts.length, els.size(), "Incorrect number of selected elements");
+        for (int i = 0; i < ownTexts.length; i++)
+            assertEquals(ownTexts[i], els.get(i).ownText(), "Incorrect content at index " + i);
+    }
+
     @Test public void testByTag() {
-        // should be case insensitive
+        // should be case-insensitive
         Elements els = Jsoup.parse("<div id=1><div id=2><p>Hello</p></div></div><DIV id=3>").select("DIV");
-        assertEquals(3, els.size());
-        assertEquals("1", els.get(0).id());
-        assertEquals("2", els.get(1).id());
-        assertEquals("3", els.get(2).id());
+        assertSelectedIds(els, "1", "2", "3");
 
         Elements none = Jsoup.parse("<div id=1><div id=2><p>Hello</p></div></div><div id=3>").select("span");
-        assertEquals(0, none.size());
+        assertTrue(none.isEmpty());
     }
 
     @Test public void byEscapedTag() {
@@ -44,12 +59,10 @@ public class SelectorTest {
 
     @Test public void testById() {
         Elements els = Jsoup.parse("<div><p id=foo>Hello</p><p id=foo>Foo two!</p></div>").select("#foo");
-        assertEquals(2, els.size());
-        assertEquals("Hello", els.get(0).text());
-        assertEquals("Foo two!", els.get(1).text());
+        assertSelectedOwnText(els, "Hello", "Foo two!");
 
         Elements none = Jsoup.parse("<div id=1></div>").select("#foo");
-        assertEquals(0, none.size());
+        assertTrue(none.isEmpty());
     }
 
     @Test public void byEscapedId() {
@@ -67,22 +80,18 @@ public class SelectorTest {
 
     @Test public void testByClass() {
         Elements els = Jsoup.parse("<p id=0 class='ONE two'><p id=1 class='one'><p id=2 class='two'>").select("P.One");
-        assertEquals(2, els.size());
-        assertEquals("0", els.get(0).id());
-        assertEquals("1", els.get(1).id());
+        assertSelectedIds(els, "0", "1");
 
         Elements none = Jsoup.parse("<div class='one'></div>").select(".foo");
-        assertEquals(0, none.size());
+        assertTrue(none.isEmpty());
 
-        Elements els2 = Jsoup.parse("<div class='One-Two'></div>").select(".one-two");
-        assertEquals(1, els2.size());
+        Elements els2 = Jsoup.parse("<div class='One-Two' id=1></div>").select(".one-two");
+        assertSelectedIds(els2, "1");
     }
 
     @Test public void byEscapedClass() {
-        Element els = Jsoup.parse("<p class='one.two#three'>One</p>");
-
-        Element one = els.expectFirst("p.one\\.two\\#three");
-        assertEquals("One", one.text());
+        Document doc = Jsoup.parse("<p class='one.two#three'>One</p>");
+        assertSelectedOwnText(doc.select("p.one\\.two\\#three"), "One");
     }
 
     @Test public void testByClassCaseInsensitive() {
@@ -91,8 +100,7 @@ public class SelectorTest {
         Elements elsFromAttr = Jsoup.parse(html).select("p[class=foo]");
 
         assertEquals(elsFromAttr.size(), elsFromClass.size());
-        assertEquals(3, elsFromClass.size());
-        assertEquals("Two", elsFromClass.get(1).text());
+        assertSelectedOwnText(elsFromClass, "One", "Two", "Three");
     }
 
 
@@ -143,43 +151,31 @@ public void testByAttribute(Locale locale) {
     @Test public void testNamespacedTag() {
         Document doc = Jsoup.parse("<div><abc:def id=1>Hello</abc:def></div> <abc:def class=bold id=2>There</abc:def>");
         Elements byTag = doc.select("abc|def");
-        assertEquals(2, byTag.size());
-        assertEquals("1", byTag.first().id());
-        assertEquals("2", byTag.last().id());
+        assertSelectedIds(byTag, "1", "2");
 
         Elements byAttr = doc.select(".bold");
-        assertEquals(1, byAttr.size());
-        assertEquals("2", byAttr.last().id());
+        assertSelectedIds(byAttr, "2");
 
         Elements byTagAttr = doc.select("abc|def.bold");
-        assertEquals(1, byTagAttr.size());
-        assertEquals("2", byTagAttr.last().id());
+        assertSelectedIds(byTagAttr, "2");
 
         Elements byContains = doc.select("abc|def:contains(e)");
-        assertEquals(2, byContains.size());
-        assertEquals("1", byContains.first().id());
-        assertEquals("2", byContains.last().id());
+        assertSelectedIds(byContains, "1", "2");
     }
 
     @Test public void testWildcardNamespacedTag() {
         Document doc = Jsoup.parse("<div><abc:def id=1>Hello</abc:def></div> <abc:def class=bold id=2>There</abc:def>");
         Elements byTag = doc.select("*|def");
-        assertEquals(2, byTag.size());
-        assertEquals("1", byTag.first().id());
-        assertEquals("2", byTag.last().id());
+        assertSelectedIds(byTag, "1", "2");
 
         Elements byAttr = doc.select(".bold");
-        assertEquals(1, byAttr.size());
-        assertEquals("2", byAttr.last().id());
+        assertSelectedIds(byAttr, "2");
 
         Elements byTagAttr = doc.select("*|def.bold");
-        assertEquals(1, byTagAttr.size());
-        assertEquals("2", byTagAttr.last().id());
+        assertSelectedIds(byTagAttr, "2");
 
         Elements byContains = doc.select("*|def:contains(e)");
-        assertEquals(2, byContains.size());
-        assertEquals("1", byContains.first().id());
-        assertEquals("2", byContains.last().id());
+        assertSelectedIds(byContains, "1", "2");
     }
 
     @Test public void testWildcardNamespacedXmlTag() {
@@ -189,22 +185,16 @@ public void testByAttribute(Locale locale) {
         );
 
         Elements byTag = doc.select("*|Def");
-        assertEquals(2, byTag.size());
-        assertEquals("1", byTag.first().id());
-        assertEquals("2", byTag.last().id());
+        assertSelectedIds(byTag, "1", "2");
 
         Elements byAttr = doc.select(".bold");
-        assertEquals(1, byAttr.size());
-        assertEquals("2", byAttr.last().id());
+        assertSelectedIds(byAttr, "2");
 
         Elements byTagAttr = doc.select("*|Def.bold");
-        assertEquals(1, byTagAttr.size());
-        assertEquals("2", byTagAttr.last().id());
+        assertSelectedIds(byTagAttr, "2");
 
         Elements byContains = doc.select("*|Def:contains(e)");
-        assertEquals(2, byContains.size());
-        assertEquals("1", byContains.first().id());
-        assertEquals("2", byContains.last().id());
+        assertSelectedIds(byContains, "1", "2");
     }
 
     @Test public void testWildCardNamespacedCaseVariations() {
@@ -242,18 +232,13 @@ public void testByAttributeStarting(Locale locale) {
     @Test public void testByAttributeRegex() {
         Document doc = Jsoup.parse("<p><img src=foo.png id=1><img src=bar.jpg id=2><img src=qux.JPEG id=3><img src=old.gif><img></p>");
         Elements imgs = doc.select("img[src~=(?i)\\.(png|jpe?g)]");
-        assertEquals(3, imgs.size());
-        assertEquals("1", imgs.get(0).id());
-        assertEquals("2", imgs.get(1).id());
-        assertEquals("3", imgs.get(2).id());
+        assertSelectedIds(imgs, "1", "2", "3");
     }
 
     @Test public void testByAttributeRegexCharacterClass() {
         Document doc = Jsoup.parse("<p><img src=foo.png id=1><img src=bar.jpg id=2><img src=qux.JPEG id=3><img src=old.gif id=4></p>");
         Elements imgs = doc.select("img[src~=[o]]");
-        assertEquals(2, imgs.size());
-        assertEquals("1", imgs.get(0).id());
-        assertEquals("4", imgs.get(1).id());
+        assertSelectedIds(imgs, "1", "4");
     }
 
     @Test public void testByAttributeRegexCombined() {
@@ -1172,13 +1157,67 @@ public void wildcardNamespaceMatchesNoNamespace() {
         Elements empty = doc.select("li:empty");
         Elements notEmpty = doc.select("li:not(:empty)");
 
-        assertEquals(3, empty.size());
-        assertEquals(2, notEmpty.size());
+        assertSelectedIds(empty, "1", "2", "3");
+        assertSelectedIds(notEmpty, "4", "5");
+    }
+
+    @Test public void parentFromSpecifiedDescender() {
+        // https://github.com/jhy/jsoup/issues/2018
+        Document doc = Jsoup.parse(
+            "<ul id=outer><li>Foo</li><li>Bar <ul id=inner><li>Baz</li><li>Qux</li></ul> </li></ul>");
+
+        Element outer = doc.expectFirst("#outer");
+        assertEquals(2, outer.childrenSize());
+
+        Element first = outer.expectFirst("> li:nth-child(1)");
+        assertEquals("Foo", first.ownText());
+        assertTrue(first.select("ul").isEmpty());
+
+        Element second = outer.expectFirst("> li:nth-child(2)");
+        assertEquals("Bar", second.ownText());
+
+        // the regression: a select made from the second li was not restricted to that li's context
+        Elements viaChild = second.select("ul > li");
+        assertSelectedOwnText(viaChild, "Baz", "Qux");
+
+        // the parent combinator (" ") must select the same elements as the immediate parent combinator (">")
+        Elements viaDescendant = second.select("ul li");
+        assertEquals(viaChild, viaDescendant);
+    }
+
+    @Test public void rootImmediateParentSubquery() {
+        // A leading combinator applies to the Root selector: "> p" matches a P whose immediate parent is the Root
+        // (<html> for a top level query, or the context element inside :has). Within a sub query, that leading
+        // combinator was incorrectly dropped.
+        Document doc = Jsoup.parse("<p id=0><span>A</p> <p id=1><b><i><span>B</p> <p id=2><i>C</p>\n");
+
+        // only a p with an immediate span or i child should match
+        Elements matched = doc.select("p:has(> span, > i)");
+        assertSelectedIds(matched, "0", "2");
+    }
+
+    @Test public void is() {
+        String html = "<h1 id=1><p></p></h1> <section><h1 id=2></h1></section> <article><h2 id=3></h2></article> <h2 id=4><p></p></h2>";
+        Document doc = Jsoup.parse(html);
+
+        assertSelectedIds(
+            doc.select(":is(section, article) :is(h1, h2, h3)"),
+            "2", "3");
+
+        assertSelectedIds(
+            doc.select(":is(section, article) ~ :is(h1, h2, h3):has(p)"),
+            "4");
+
+        assertSelectedIds(
+            doc.select(":is(h1:has(p), h2:has(section), h3)"),
+            "1");
+
+        assertSelectedIds(
+            doc.select(":is(h1, h2, h3):has(p)"),
+            "1", "4");
 
-        assertEquals("1", empty.get(0).id());
-        assertEquals("2", empty.get(1).id());
-        assertEquals("3", empty.get(2).id());
-        assertEquals("4", notEmpty.get(0).id());
-        assertEquals("5", notEmpty.get(1).id());
+        String query = "div :is(h1, h2)";
+        Evaluator parse = QueryParser.parse(query);
+        assertEquals(query, parse.toString());
     }
 }
diff --git a/src/test/java/org/jsoup/select/TraversorTest.java b/src/test/java/org/jsoup/select/TraversorTest.java
index 11a5167d61..2b1da28137 100644
--- a/src/test/java/org/jsoup/select/TraversorTest.java
+++ b/src/test/java/org/jsoup/select/TraversorTest.java
@@ -8,8 +8,10 @@
 import org.jsoup.nodes.TextNode;
 import org.junit.jupiter.api.Test;
 
-import static org.junit.jupiter.api.Assertions.assertEquals;
-import static org.junit.jupiter.api.Assertions.assertNotNull;
+import java.util.concurrent.atomic.AtomicBoolean;
+import java.util.concurrent.atomic.AtomicInteger;
+
+import static org.junit.jupiter.api.Assertions.*;
 
 public class TraversorTest {
     // Note: NodeTraversor.traverse(new NodeVisitor) is tested in
@@ -193,4 +195,29 @@ else if (node instanceof TextNode && ((TextNode) node).text().equals("Three"))
 
         assertEquals("<div><p id=\"2\">Two</p><p></p></div>", TextUtil.stripNewlines(doc.body().html()));
     }
+
+    @Test void elementFunctionalTraverse() {
+        Element body = Jsoup.parse("<div><p>1<p>2<p>3").body();
+
+        // tally every visited node and track the greatest depth reported to the visitor
+        AtomicInteger visited = new AtomicInteger();
+        AtomicInteger maxDepth = new AtomicInteger();
+        body.traverse((node, depth) -> {
+            visited.incrementAndGet();
+            maxDepth.accumulateAndGet(depth, Math::max);
+        });
+
+        assertEquals(8, visited.get()); // body and contents
+        assertEquals(3, maxDepth.get());
+    }
+
+    @Test void seesDocRoot() {
+        Document doc = Jsoup.parse("<p>One");
+        // flips once the visitor is handed the document node itself
+        AtomicBoolean sawDocument = new AtomicBoolean(false);
+        doc.traverse((node, depth) -> {
+            if (node.equals(doc)) sawDocument.set(true);
+        });
+        assertTrue(sawDocument.get());
+    }
 }
diff --git a/src/test/resources/htmltests/osi-logo.svg b/src/test/resources/htmltests/osi-logo.svg
new file mode 100644
index 0000000000..1aefc1007c
--- /dev/null
+++ b/src/test/resources/htmltests/osi-logo.svg
@@ -0,0 +1,185 @@
+<?xml version="1.0" encoding="UTF-8" standalone="no"?>
+<svg
+   xmlns:dc="http://purl.org/dc/elements/1.1/"
+   xmlns:cc="http://creativecommons.org/ns#"
+   xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
+   xmlns:svg="http://www.w3.org/2000/svg"
+   xmlns="http://www.w3.org/2000/svg"
+   xmlns:sodipodi="http://sodipodi.sourceforge.net/DTD/sodipodi-0.dtd"
+   xmlns:inkscape="http://www.inkscape.org/namespaces/inkscape"
+   width="8in"
+   height="11in"
+   viewBox="0 0 576 792.00001"
+   version="1.2"
+   id="svg5"
+   sodipodi:docname="OurInSourceLogo.eps"
+   inkscape:version="0.92.3 (2405546, 2018-03-11)">
+  <metadata
+     id="metadata11">
+    <rdf:RDF>
+      <cc:Work
+         rdf:about="">
+        <dc:format>image/svg+xml</dc:format>
+        <dc:type
+           rdf:resource="http://purl.org/dc/dcmitype/StillImage" />
+        <dc:title></dc:title>
+      </cc:Work>
+    </rdf:RDF>
+  </metadata>
+  <defs
+     id="defs9" />
+  <sodipodi:namedview
+     pagecolor="#ffffff"
+     bordercolor="#666666"
+     borderopacity="1"
+     objecttolerance="10"
+     gridtolerance="10"
+     guidetolerance="10"
+     inkscape:pageopacity="0"
+     inkscape:pageshadow="2"
+     inkscape:window-width="1600"
+     inkscape:window-height="863"
+     id="namedview7"
+     showgrid="false"
+     units="in"
+     inkscape:zoom="1"
+     inkscape:cx="180.72684"
+     inkscape:cy="645.05307"
+     inkscape:window-x="0"
+     inkscape:window-y="0"
+     inkscape:window-maximized="1"
+     inkscape:current-layer="svg5" />
+  <g
+     id="surface480"
+     transform="translate(56.319251,47.201249)">
+    <path
+       style="fill:#3da638;fill-opacity:1;fill-rule:nonzero;stroke:#1c511c;stroke-width:153.69700623;stroke-linecap:round;stroke-linejoin:round;stroke-miterlimit:4;stroke-opacity:1"
+       d="m 2607.2266,1436.6797 c 322.5781,119.8047 490.9765,350.5078 490.9765,747.5781 0,397.0703 -334.6093,746.9531 -752.6953,747.6563 -441.2109,0.7031 -774.0234,-349.1407 -768.7109,-747.6563 5.3125,-398.5156 195.3906,-663.6328 499.5703,-759.4922 L 1537.5,99.0625 C 816.28906,285.78125 82.773438,1136.6016 82.773438,2184.2578 c 0,1240.8594 997.031262,2246.7969 2246.718762,2246.7969 1249.6875,0 2262.7344,-1005.9375 2262.7344,-2246.7969 0,-1063.9453 -726.5625,-1902.92968 -1463.1641,-2088.906238 z m 0,0"
+       transform="matrix(0.1,0,0,-0.1,0,451)"
+       id="path2"
+       inkscape:connector-curvature="0" />
+  </g>
+  <flowRoot
+     xml:space="preserve"
+     id="flowRoot3726"
+     style="fill:black;stroke:none;stroke-opacity:1;stroke-width:1px;stroke-linejoin:miter;stroke-linecap:butt;fill-opacity:1;font-family:Open Sans;font-style:normal;font-weight:normal;font-size:72px;-inkscape-font-specification:Open Sans;line-height:125%;letter-spacing:0px;word-spacing:0px;font-stretch:normal;font-variant:normal;text-anchor:start;text-align:start;writing-mode:lr"><flowRegion
+       id="flowRegion3728"><rect
+         id="rect3730"
+         width="575.70789"
+         height="214.01315"
+         x="78.846954"
+         y="733.10297" /></flowRegion><flowPara
+       id="flowPara3732" /></flowRoot>  <flowRoot
+     xml:space="preserve"
+     id="flowRoot3734"
+     style="fill:black;stroke:none;stroke-opacity:1;stroke-width:1px;stroke-linejoin:miter;stroke-linecap:butt;fill-opacity:1;font-family:Open Sans;font-style:normal;font-weight:normal;font-size:72px;-inkscape-font-specification:Open Sans;line-height:125%;letter-spacing:0px;word-spacing:0px;font-stretch:normal;font-variant:normal;text-anchor:start;text-align:start;writing-mode:lr"><flowRegion
+       id="flowRegion3736"><rect
+         id="rect3738"
+         width="635.7818"
+         height="287.85394"
+         x="88.859261"
+         y="688.04755" /></flowRegion><flowPara
+       id="flowPara3740" /></flowRoot>  <g
+     aria-label="open source initiative"
+     transform="matrix(1.0829245,0,0,1.148944,-0.49785346,-115.50738)"
+     style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:54px;line-height:125%;font-family:'Open Sans';-inkscape-font-specification:'Open Sans';text-align:start;letter-spacing:0px;word-spacing:0px;writing-mode:lr-tb;text-anchor:start;fill:#000000;fill-opacity:1;stroke:none;stroke-width:0.75px;stroke-linecap:butt;stroke-linejoin:miter;stroke-opacity:1"
+     id="flowRoot3742">
+    <path
+       d="m 91.042969,583.30725 q 0,9.77344 -5.273438,15.25781 -5.238281,5.44922 -14.695312,5.44922 -9.070313,0 -14.449219,-5.58984 -5.34375,-5.58985 -5.34375,-15.11719 0,-9.73828 5.238281,-15.11719 5.273438,-5.41406 14.765625,-5.41406 5.871094,0 10.371094,2.49609 4.5,2.4961 6.925781,7.17188 2.460938,4.64062 2.460938,10.86328 z m -25.804688,0 q 0,5.13281 1.371094,7.83984 1.371094,2.67188 4.605469,2.67188 3.199218,0 4.5,-2.67188 1.335937,-2.70703 1.335937,-7.83984 0,-5.09766 -1.335937,-7.69922 -1.335938,-2.60156 -4.570313,-2.60156 -3.164062,0 -4.535156,2.60156 -1.371094,2.56641 -1.371094,7.69922 z"
+       style="font-style:normal;font-variant:normal;font-weight:800;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Ultra-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle"
+       id="path3756" />
+    <path
+       d="m 122.75391,604.01428 q -3.02344,0 -5.41407,-0.98437 -2.39062,-1.01953 -4.74609,-3.6211 h -0.63281 q 0.63281,4.1836 0.63281,5.20313 v 15.99609 H 98.847656 v -57.1289 h 11.179684 l 1.9336,5.0625 h 0.63281 q 3.83203,-5.76563 10.58203,-5.76563 6.60938,0 10.37109,5.48438 3.76172,5.48437 3.76172,15.04687 0,9.63281 -3.9375,15.1875 -3.90234,5.51953 -10.61718,5.51953 z m -4.60547,-30.44531 q -3.02344,0 -4.25391,2.17969 -1.19531,2.14453 -1.30078,6.39843 v 1.08985 q 0,5.13281 1.37109,7.41797 1.3711,2.28515 4.32422,2.28515 2.63672,0 3.83203,-2.25 1.19532,-2.28515 1.19532,-7.52343 0,-5.13282 -1.19532,-7.34766 -1.19531,-2.25 -3.97265,-2.25 z"
+       style="font-style:normal;font-variant:normal;font-weight:800;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Ultra-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle"
+       id="path3758" />
+    <path
+       d="m 164.34375,604.01428 q -9.94922,0 -15.46875,-5.27344 -5.48438,-5.30859 -5.48438,-15.08203 0,-10.08984 5.09766,-15.46875 5.09766,-5.41406 14.55469,-5.41406 9,0 13.88672,4.71094 4.92187,4.67578 4.92187,13.5 v 6.11719 h -24.57422 q 0.14063,3.33984 2.42578,5.23828 2.32032,1.89843 6.29297,1.89843 3.6211,0 6.64453,-0.66796 3.0586,-0.70313 6.60938,-2.35547 v 9.8789 q -3.23438,1.65235 -6.67969,2.28516 -3.44531,0.63281 -8.22656,0.63281 z m -0.80859,-31.88672 q -2.42579,0 -4.07813,1.54688 -1.61719,1.51172 -1.89844,4.78125 h 11.8125 q -0.0703,-2.88281 -1.65234,-4.60547 -1.54688,-1.72266 -4.18359,-1.72266 z"
+       style="font-style:normal;font-variant:normal;font-weight:800;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Ultra-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle"
+       id="path3760" />
+    <path
+       d="m 214.82812,603.31116 v -21.72657 q 0,-3.97265 -1.16015,-5.97656 -1.125,-2.03906 -3.65625,-2.03906 -3.48047,0 -5.02735,2.77734 -1.54687,2.77735 -1.54687,9.52735 v 17.4375 h -13.74609 v -39.83203 h 10.37109 l 1.72266,4.92187 h 0.80859 q 1.75781,-2.8125 4.85156,-4.21875 3.12891,-1.40625 7.17188,-1.40625 6.60937,0 10.26562,3.83203 3.69141,3.83203 3.69141,10.79297 v 25.91016 z"
+       style="font-style:normal;font-variant:normal;font-weight:800;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Ultra-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle"
+       id="path3762" />
+    <path
+       d="m 283.91016,592.23694 q 0,5.69531 -4.14844,8.7539 -4.14844,3.02344 -11.88281,3.02344 -7.76954,0 -12.48047,-2.35547 v -7.13672 q 6.85547,3.16407 12.76172,3.16407 7.6289,0 7.6289,-4.60547 0,-1.47656 -0.84375,-2.46094 -0.84375,-0.98437 -2.77734,-2.03906 -1.9336,-1.05469 -5.37891,-2.39063 -6.71484,-2.60156 -9.10547,-5.20312 -2.35547,-2.60156 -2.35547,-6.75 0,-4.99219 4.00782,-7.73438 4.04297,-2.77734 10.96875,-2.77734 6.85547,0 12.97265,2.77734 l -2.67187,6.22266 q -6.29297,-2.60156 -10.58203,-2.60156 -6.53907,0 -6.53907,3.72656 0,1.82812 1.6875,3.09375 1.72266,1.26562 7.45313,3.48047 4.81641,1.86328 6.99609,3.41015 2.17969,1.54688 3.23438,3.58594 1.05469,2.00391 1.05469,4.81641 z"
+       style="font-style:normal;font-variant:normal;font-weight:600;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Semi-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle"
+       id="path3764" />
+    <path
+       d="m 327.29297,583.79944 q 0,9.52734 -4.88672,14.87109 -4.88672,5.34375 -13.60547,5.34375 -5.44922,0 -9.63281,-2.46094 -4.1836,-2.46093 -6.4336,-7.0664 -2.25,-4.60547 -2.25,-10.6875 0,-9.45703 4.85157,-14.76563 4.85156,-5.30859 13.67578,-5.30859 8.4375,0 13.35937,5.44922 4.92188,5.41406 4.92188,14.625 z m -28.30078,0 q 0,13.46484 9.94922,13.46484 9.84375,0 9.84375,-13.46484 0,-13.32422 -9.91407,-13.32422 -5.20312,0 -7.55859,3.44531 -2.32031,3.44531 -2.32031,9.87891 z"
+       style="font-style:normal;font-variant:normal;font-weight:600;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Semi-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle"
+       id="path3766" />
+    <path
+       d="m 364.24219,603.31116 -1.16016,-5.09766 h -0.42187 q -1.72266,2.70703 -4.92188,4.25391 -3.16406,1.54687 -7.24219,1.54687 -7.0664,0 -10.54687,-3.51562 -3.48047,-3.51563 -3.48047,-10.65235 v -25.41797 h 8.33203 v 23.97657 q 0,4.46484 1.82813,6.71484 1.82812,2.21484 5.73046,2.21484 5.20313,0 7.62891,-3.09375 2.46094,-3.1289 2.46094,-10.4414 v -19.3711 h 8.29687 v 38.88282 z"
+       style="font-style:normal;font-variant:normal;font-weight:600;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Semi-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle"
+       id="path3768" />
+    <path
+       d="m 402.24609,563.72522 q 2.4961,0 4.11328,0.35156 l -0.80859,7.69922 q -1.75781,-0.42187 -3.65625,-0.42187 -4.95703,0 -8.05078,3.23437 -3.05859,3.23438 -3.05859,8.40234 v 20.32032 h -8.26172 v -38.88282 h 6.46875 l 1.08984,6.85547 h 0.42188 q 1.93359,-3.48047 5.02734,-5.51953 3.12891,-2.03906 6.71484,-2.03906 z"
+       style="font-style:normal;font-variant:normal;font-weight:600;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Semi-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle"
+       id="path3770" />
+    <path
+       d="m 429.28125,604.01428 q -8.82422,0 -13.42969,-5.13281 -4.57031,-5.16797 -4.57031,-14.80078 0,-9.8086 4.78125,-15.08203 4.81641,-5.27344 13.88672,-5.27344 6.15234,0 11.07422,2.28516 l -2.4961,6.64453 q -5.23828,-2.03907 -8.64843,-2.03907 -10.08985,0 -10.08985,13.39454 0,6.53906 2.4961,9.84375 2.53125,3.26953 7.38281,3.26953 5.51953,0 10.4414,-2.74219 v 7.20703 q -2.21484,1.30078 -4.74609,1.86328 -2.49609,0.5625 -6.08203,0.5625 z"
+       style="font-style:normal;font-variant:normal;font-weight:600;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Semi-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle"
+       id="path3772" />
+    <path
+       d="m 466.30078,604.01428 q -9.07031,0 -14.20312,-5.27344 Q 447,593.43225 447,584.151 q 0,-9.52734 4.74609,-14.97656 4.7461,-5.44922 13.04297,-5.44922 7.69922,0 12.16406,4.67578 4.46485,4.67578 4.46485,12.86719 v 4.46484 h -25.91016 q 0.17578,5.66016 3.0586,8.71875 2.88281,3.02344 8.12109,3.02344 3.44531,0 6.39844,-0.63281 2.98828,-0.66797 6.39843,-2.17969 v 6.71484 q -3.02343,1.44141 -6.11718,2.03907 -3.09375,0.59765 -7.06641,0.59765 z m -1.51172,-34.03125 q -3.9375,0 -6.32812,2.4961 -2.35547,2.49609 -2.8125,7.27734 h 17.64843 q -0.0703,-4.81641 -2.32031,-7.27734 -2.25,-2.4961 -6.1875,-2.4961 z"
+       style="font-style:normal;font-variant:normal;font-weight:600;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Semi-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle"
+       id="path3774" />
+    <path
+       d="m 128.51953,675.51001 h -8.26172 V 636.6272 h 8.26172 z m -8.7539,-49.18359 q 0,-2.21485 1.19531,-3.41016 1.23047,-1.19531 3.48047,-1.19531 2.17968,0 3.375,1.19531 1.23046,1.19531 1.23046,3.41016 0,2.10937 -1.23046,3.33984 -1.19532,1.19531 -3.375,1.19531 -2.25,0 -3.48047,-1.19531 -1.19531,-1.23047 -1.19531,-3.33984 z"
+       style="font-style:normal;font-variant:normal;font-weight:600;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Semi-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle;stroke-width:0.75px"
+       id="path3776" />
+    <path
+       d="m 174.57422,675.51001 h -8.29688 v -23.90625 q 0,-4.5 -1.82812,-6.71484 -1.79297,-2.21485 -5.73047,-2.21485 -5.23828,0 -7.66406,3.09375 -2.42578,3.09375 -2.42578,10.3711 v 19.37109 h -8.26172 V 636.6272 h 6.46875 l 1.16015,5.09765 h 0.42188 q 1.75781,-2.77734 4.99219,-4.28906 3.23437,-1.51172 7.17187,-1.51172 13.99219,0 13.99219,14.23828 z"
+       style="font-style:normal;font-variant:normal;font-weight:600;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Semi-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle;stroke-width:0.75px"
+       id="path3778" />
+    <path
+       d="m 194.33203,675.51001 h -8.26172 V 636.6272 h 8.26172 z m -8.75391,-49.18359 q 0,-2.21485 1.19532,-3.41016 1.23047,-1.19531 3.48047,-1.19531 2.17968,0 3.375,1.19531 1.23046,1.19531 1.23046,3.41016 0,2.10937 -1.23046,3.33984 -1.19532,1.19531 -3.375,1.19531 -2.25,0 -3.48047,-1.19531 -1.19532,-1.23047 -1.19532,-3.33984 z"
+       style="font-style:normal;font-variant:normal;font-weight:600;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Semi-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle;stroke-width:0.75px"
+       id="path3780" />
+    <path
+       d="m 220.66406,669.53345 q 3.02344,0 6.04688,-0.94922 v 6.22265 q -1.3711,0.59766 -3.55078,0.98438 -2.14454,0.42187 -4.46485,0.42187 -11.74219,0 -11.74219,-12.375 v -20.95312 h -5.30859 v -3.65625 l 5.69531,-3.02344 2.8125,-8.22656 H 215.25 v 8.64844 h 11.07422 v 6.25781 H 215.25 v 20.8125 q 0,2.98828 1.47656,4.42969 1.51172,1.40625 3.9375,1.40625 z"
+       style="font-style:normal;font-variant:normal;font-weight:600;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Semi-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle;stroke-width:0.75px"
+       id="path3782" />
+    <path
+       d="m 242.70703,675.51001 h -8.26172 V 636.6272 h 8.26172 z m -8.75391,-49.18359 q 0,-2.21485 1.19532,-3.41016 1.23047,-1.19531 3.48047,-1.19531 2.17968,0 3.375,1.19531 1.23046,1.19531 1.23046,3.41016 0,2.10937 -1.23046,3.33984 -1.19532,1.19531 -3.375,1.19531 -2.25,0 -3.48047,-1.19531 -1.19532,-1.23047 -1.19532,-3.33984 z"
+       style="font-style:normal;font-variant:normal;font-weight:600;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Semi-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle;stroke-width:0.75px"
+       id="path3784" />
+    <path
+       d="m 278.88281,675.51001 -1.65234,-5.41406 h -0.28125 q -2.8125,3.55078 -5.66016,4.85156 -2.84765,1.26562 -7.3125,1.26562 -5.73047,0 -8.96484,-3.09375 -3.19922,-3.09375 -3.19922,-8.7539 0,-6.01172 4.46484,-9.07031 4.46485,-3.0586 13.60547,-3.33985 l 6.71485,-0.21094 v -2.07421 q 0,-3.72657 -1.75782,-5.55469 -1.72265,-1.86328 -5.3789,-1.86328 -2.98828,0 -5.73047,0.8789 -2.74219,0.87891 -5.27344,2.07422 l -2.67187,-5.90625 q 3.16406,-1.65234 6.92578,-2.49609 3.76172,-0.87891 7.10156,-0.87891 7.41797,0 11.17969,3.23438 3.79687,3.23437 3.79687,10.16015 v 26.19141 z m -12.30469,-5.625 q 4.5,0 7.20704,-2.49609 2.74218,-2.53125 2.74218,-7.06641 v -3.375 l -4.99218,0.21094 q -5.83594,0.21093 -8.50782,1.96875 -2.63672,1.72265 -2.63672,5.30859 0,2.60156 1.54688,4.04297 1.54687,1.40625 4.64062,1.40625 z"
+       style="font-style:normal;font-variant:normal;font-weight:600;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Semi-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle;stroke-width:0.75px"
+       id="path3786" />
+    <path
+       d="m 310.80469,669.53345 q 3.02343,0 6.04687,-0.94922 v 6.22265 q -1.37109,0.59766 -3.55078,0.98438 -2.14453,0.42187 -4.46484,0.42187 -11.74219,0 -11.74219,-12.375 v -20.95312 h -5.30859 v -3.65625 l 5.69531,-3.02344 2.8125,-8.22656 h 5.09765 v 8.64844 h 11.07422 v 6.25781 h -11.07422 v 20.8125 q 0,2.98828 1.47657,4.42969 1.51172,1.40625 3.9375,1.40625 z"
+       style="font-style:normal;font-variant:normal;font-weight:600;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Semi-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle;stroke-width:0.75px"
+       id="path3788" />
+    <path
+       d="m 332.84766,675.51001 h -8.26172 V 636.6272 h 8.26172 z m -8.75391,-49.18359 q 0,-2.21485 1.19531,-3.41016 1.23047,-1.19531 3.48047,-1.19531 2.17969,0 3.375,1.19531 1.23047,1.19531 1.23047,3.41016 0,2.10937 -1.23047,3.33984 -1.19531,1.19531 -3.375,1.19531 -2.25,0 -3.48047,-1.19531 -1.19531,-1.23047 -1.19531,-3.33984 z"
+       style="font-style:normal;font-variant:normal;font-weight:600;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Semi-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle;stroke-width:0.75px"
+       id="path3790" />
+    <path
+       d="M 353.55469,675.51001 338.78906,636.6272 h 8.71875 l 7.91016,22.60547 q 2.03906,5.69531 2.46094,9.21093 h 0.28125 q 0.3164,-2.53125 2.46093,-9.21093 l 7.91016,-22.60547 h 8.78906 l -14.83594,38.88281 z"
+       style="font-style:normal;font-variant:normal;font-weight:600;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Semi-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle;stroke-width:0.75px"
+       id="path3792" />
+    <path
+       d="m 400.20703,676.21313 q -9.07031,0 -14.20312,-5.27343 -5.09766,-5.3086 -5.09766,-14.58985 0,-9.52734 4.74609,-14.97656 4.7461,-5.44922 13.04297,-5.44922 7.69922,0 12.16406,4.67578 4.46485,4.67578 4.46485,12.86719 v 4.46484 h -25.91016 q 0.17578,5.66016 3.0586,8.71875 2.88281,3.02344 8.12109,3.02344 3.44531,0 6.39844,-0.63281 2.98828,-0.66797 6.39843,-2.17969 v 6.71485 q -3.02343,1.4414 -6.11718,2.03906 -3.09375,0.59765 -7.06641,0.59765 z m -1.51172,-34.03125 q -3.9375,0 -6.32812,2.4961 -2.35547,2.49609 -2.8125,7.27734 h 17.64843 q -0.0703,-4.8164 -2.32031,-7.27734 -2.25,-2.4961 -6.1875,-2.4961 z"
+       style="font-style:normal;font-variant:normal;font-weight:600;font-stretch:normal;font-size:72px;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Semi-Bold';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:center;writing-mode:lr-tb;text-anchor:middle;stroke-width:0.75px"
+       id="path3794" />
+    <g
+       aria-label="®"
+       transform="matrix(0.69256906,0,0,0.65277333,405.24465,262.29382)"
+       style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:48px;line-height:125%;font-family:'Open Sans';-inkscape-font-specification:'Open Sans, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-feature-settings:normal;text-align:start;letter-spacing:0px;word-spacing:0px;writing-mode:lr-tb;text-anchor:start;fill:#000000;fill-opacity:1;stroke:none;stroke-width:1px;stroke-linecap:butt;stroke-linejoin:miter;stroke-opacity:1"
+       id="flowRoot3797">
+      <path
+         d="m 38.220703,565.03621 h 2.53125 q 1.875,0 3,-0.96093 1.148438,-0.98438 1.148438,-2.48438 0,-1.75781 -1.007813,-2.50781 -1.007812,-0.77344 -3.1875,-0.77344 h -2.484375 z m 10.171875,-3.53906 q 0,1.875 -1.007812,3.32813 -0.984375,1.42968 -2.789063,2.13281 l 5.578125,9.25781 h -3.9375 l -4.851562,-8.29687 h -3.164063 v 8.29687 h -3.46875 v -20.88281 h 6.117188 q 3.890625,0 5.695312,1.52344 1.828125,1.52343 1.828125,4.64062 z m -24.773437,4.26563 q 0,-4.6875 2.34375,-8.78907 2.34375,-4.10156 6.445312,-6.46875 4.101563,-2.36718 8.835938,-2.36718 4.6875,0 8.789062,2.34375 4.101563,2.34375 6.46875,6.44531 2.367188,4.10156 2.367188,8.83594 0,4.61718 -2.273438,8.67187 -2.273437,4.05469 -6.375,6.49219 -4.101562,2.4375 -8.976562,2.4375 -4.851563,0 -8.953125,-2.41406 -4.101563,-2.4375 -6.398438,-6.49219 -2.273437,-4.05469 -2.273437,-8.69531 z m 2.460937,0 q 0,4.05468 2.039063,7.59375 2.039062,3.51562 5.554687,5.55468 3.539063,2.01563 7.570313,2.01563 4.078125,0 7.570312,-2.03906 3.492188,-2.03907 5.53125,-5.50782 2.0625,-3.49218 2.0625,-7.61718 0,-4.07813 -2.039062,-7.57032 -2.039063,-3.49218 -5.53125,-5.53125 -3.46875,-2.0625 -7.59375,-2.0625 -4.078125,0 -7.570313,2.03907 -3.492187,2.03906 -5.554687,5.53125 -2.039063,3.46875 -2.039063,7.59375 z"
+         style=""
+         id="path3805" />
+    </g>
+  </g>
+  <ellipse
+     style="color:#000000;display:inline;overflow:visible;visibility:visible;fill:none;fill-opacity:1;fill-rule:nonzero;stroke:none;stroke-width:7.43444252;stroke-linecap:butt;stroke-linejoin:miter;stroke-miterlimit:4;stroke-dasharray:none;stroke-dashoffset:0;stroke-opacity:1;marker:none;enable-background:accumulate"
+     id="path256"
+     cx="-31.875"
+     cy="191.25"
+     rx="229.24777"
+     ry="226.62277" />
+</svg>
diff --git a/src/test/resources/local-cert/README.md b/src/test/resources/local-cert/README.md
new file mode 100644
index 0000000000..2d4cbe5e38
--- /dev/null
+++ b/src/test/resources/local-cert/README.md
@@ -0,0 +1,15 @@
+This directory contains resources for a self-signed TLS certificate, used in jsoup's local integration tests.
+
+Create the certificate:
+
+```sh
+openssl genrsa 2048 > server.key
+chmod 400 server.key
+openssl req -new -x509 -config cert.conf -nodes -sha256 -days 36135 -key server.key -out server.crt
+```
+
+Create the Java key store, which is used by the server and trusted by the client in `TestServer.java`:
+```sh
+openssl pkcs12 -export -in server.crt -inkey server.key -out server.p12 -name jsoup -passout pass:hunter2
+keytool -importkeystore -srckeystore server.p12 -srcstoretype PKCS12 -destkeystore server.pfx -deststoretype PKCS12  -srcstorepass hunter2 -deststorepass hunter2
+```
diff --git a/src/test/resources/local-cert/cert.conf b/src/test/resources/local-cert/cert.conf
new file mode 100644
index 0000000000..c9019e4828
--- /dev/null
+++ b/src/test/resources/local-cert/cert.conf
@@ -0,0 +1,13 @@
+[ req ]
+distinguished_name  = subject
+x509_extensions     = x509_ext
+prompt              = no
+
+[ subject ]
+commonName          = jsoup test server
+
+[ x509_ext ]
+subjectAltName      = @alternate_names
+
+[ alternate_names ]
+DNS.1               = localhost
diff --git a/src/test/resources/local-cert/server.crt b/src/test/resources/local-cert/server.crt
new file mode 100644
index 0000000000..27d549edab
--- /dev/null
+++ b/src/test/resources/local-cert/server.crt
@@ -0,0 +1,19 @@
+-----BEGIN CERTIFICATE-----
+MIIC/zCCAeegAwIBAgIUKEHmb0P5j+5mNjNk/PTdW6t9UTcwDQYJKoZIhvcNAQEL
+BQAwHDEaMBgGA1UEAwwRanNvdXAgdGVzdCBzZXJ2ZXIwIBcNMjMxMTAyMjM0OTE1
+WhgPMjEyMjEwMDkyMzQ5MTVaMBwxGjAYBgNVBAMMEWpzb3VwIHRlc3Qgc2VydmVy
+MIIBIjANBgkqhkiG9w0BAQEFAAOCAQ8AMIIBCgKCAQEAvkvtYwy7jnSPYM59EVsR
+SjTO8WsXHVs/UJ+Ns+7RiTeb2hUOd4lh38TOh9Yri/7WI5Ejif64FL6b1KEWRe9+
+60QKIOB0+7DUpnXomisD6TytwV8R8BSEZ4vLbMUVizr95Ze+w6SzMPshSvHBMIbU
+RimtmY1jBglHytETRBjO1etG120R1M45GJfxV8rIDOgM6FksOnWLQeKzeGKBf0vs
+5MlTz/GDs/YpXydg779QOmJAQWj78EMdetwmUPwnpC0kaO3dnlD+mzDrfeSkorrp
+5UKij1k4s2tG+E/VIskGyuc/MSU6dc8/ECzuK7c/UjpUz9ohSfLwhSGdjnx0qjXm
+kwIDAQABozcwNTAUBgNVHREEDTALgglsb2NhbGhvc3QwHQYDVR0OBBYEFAWRk6Jd
+PJrlw3uJKEG7JLku9SwsMA0GCSqGSIb3DQEBCwUAA4IBAQAxEXk5d0ACzaxtOF9+
+/XF3Zt8X/eXxyoQUaG2PyfJkN1rnO7zyx/oPIIAckaZev0eFVwOk3M5K4xxYar/Y
+DqdioKwH8qAy4kk7sdCnTU8jlkUMcFqYCt7rLcDviugjg0VO6bYLrq++oeOuDybs
+M7J3CgzPAppSpRoTgss3bGzHt87rWJ2XcHxbE8Gg2GtoZnFpcSHkx40EdlDWN8dm
+/mZlMxjVFdktz9dpqtR4Q4cAbHETomJOHC2AnhEi3PjuYhGHMbIRgtIg0XX4H/0u
+eHVvkb9xJ3SmmdidYTDlOFzLon8NqSZmmt6EDpDio62bDem49jUtnYmxJKXAxhL0
+jnwQ
+-----END CERTIFICATE-----
diff --git a/src/test/resources/local-cert/server.key b/src/test/resources/local-cert/server.key
new file mode 100644
index 0000000000..70c498c286
--- /dev/null
+++ b/src/test/resources/local-cert/server.key
@@ -0,0 +1,28 @@
+-----BEGIN PRIVATE KEY-----
+MIIEvQIBADANBgkqhkiG9w0BAQEFAASCBKcwggSjAgEAAoIBAQC+S+1jDLuOdI9g
+zn0RWxFKNM7xaxcdWz9Qn42z7tGJN5vaFQ53iWHfxM6H1iuL/tYjkSOJ/rgUvpvU
+oRZF737rRAog4HT7sNSmdeiaKwPpPK3BXxHwFIRni8tsxRWLOv3ll77DpLMw+yFK
+8cEwhtRGKa2ZjWMGCUfK0RNEGM7V60bXbRHUzjkYl/FXysgM6AzoWSw6dYtB4rN4
+YoF/S+zkyVPP8YOz9ilfJ2Dvv1A6YkBBaPvwQx163CZQ/CekLSRo7d2eUP6bMOt9
+5KSiuunlQqKPWTiza0b4T9UiyQbK5z8xJTp1zz8QLO4rtz9SOlTP2iFJ8vCFIZ2O
+fHSqNeaTAgMBAAECggEACY0zFaEqetyD49aJdYkOJZzf9EMtTlZpp6jSioEGuG33
+nysmZj6ZkItG2I+Z8PVyFyfuUjtcTwJAPRx2yzzZsIJiRcMubAG0ssRBUBevoxHe
+INIeSuAkwzPDmqqLycjEvLTwqM5IBkHcqm/XBBIIbpsh8Q6lNUTa+yWiY20hWKBX
+7I+mNg9qTsGkYCthZVBgkpmg3DCCX4l8hraHhev3KgdpaILaDSVqjd1IBwJ9ynJc
+mJ0/pvIVO7dwxJ7t7b+vNp8iJQjPlOZmz6hWKyFMhxnkOcri3OBYcr1JMkVZ38RD
+OjKhaaCnhhSH+IxwLxQQAs//S+EN3l6kOngN5cZ/aQKBgQDiEqp7kT7nAPRMq9Af
+okomKnQIpAuEfOauzH02PGkVYawCulWmr+FqdUZxz5SgPEp55IyTfD6iPaSb6QcO
+QuH3PvtZyVQv1ZrExquvd/3lS/cQwaDzV4YG46fBbw9K72BHkVV7dkxm+0p4Imid
+2XLRqT86difx1etovb7fzMXsCwKBgQDXfNh5Gk250Upyh3+7FDYr7bOvc0l9y/Xn
+eODM/yRI3MLaGTUXu90MK50AsOqxedvs4x5NvqG/n2Cr536b9C0tr09CfHeGsOMG
+OEfzxMrRv78ItBF7vLELYz1szi6JEZCeK1whgJ1osrTGWAhWkMTIErh3UOfZGgYG
+qFQGRFP8mQKBgG7FlqNVV+z4mru2tBPMAWkSBCj3uG0ChkXADNo2X4cKhK4Rf0Zd
+h6YSMKIzhC+/Wv6+7eKWTlpQugdq9voV64KqaZ5k98s4bs1cS2N+9/kSb8zWE3co
+u5NEmT4+nM+q2xI2NBx6qpULLEIRGhG+KnRw6XpLyubEWsTHtG8UdyZhAoGAVdm5
+bNYb7VICtQpiyyfMRUgYdGgb+XBO8f9ooINt81Fwl++/BUulT3n4vRO/DSIdio0Z
+v6OZUXyvyQ0blgp8DV1w2G46OIE0kX/OusHGhDY+Z7tF0+RjLMRG7pheVeGXmkxw
+EjDphZLdDsB34fUfUQ6US4UCOa5yhCiAAVcrltECgYEAlYNAELPKAcmWd+4G8Fr6
+07dIgJHZ7W45eZwwUwva9t09J/9d4wq7X4GaX98Jejdeh4nTHnBWX49m6EgQ0ccH
+4jcIvTj61aBuDNiW8p85O5gpBrCneFowFHsPElhG2nFSFhGtIST8fkiy5sBwxMFM
+1nauFIaX8tP0NxQDw+PvdDc=
+-----END PRIVATE KEY-----
diff --git a/src/test/resources/local-cert/server.p12 b/src/test/resources/local-cert/server.p12
new file mode 100644
index 0000000000..e6804a0f46
Binary files /dev/null and b/src/test/resources/local-cert/server.p12 differ
diff --git a/src/test/resources/local-cert/server.pfx b/src/test/resources/local-cert/server.pfx
new file mode 100644
index 0000000000..746aef2e35
Binary files /dev/null and b/src/test/resources/local-cert/server.pfx differ