From 54777687602faa8991364c42466c6c0b0e0c3084 Mon Sep 17 00:00:00 2001 From: Mike Woofter Date: Mon, 9 Oct 2023 13:56:07 -0500 Subject: [PATCH 01/65] first test --- source/batch-mode.txt | 12 ++++++++++++ .../read.txt => batch-mode/batch-read-config.txt} | 2 -- .../batch-read.txt} | 5 ++++- .../write.txt => batch-mode/batch-write-config.txt} | 0 source/batch-mode/batch-write.txt | 0 5 files changed, 16 insertions(+), 3 deletions(-) create mode 100644 source/batch-mode.txt rename source/{configuration/read.txt => batch-mode/batch-read-config.txt} (99%) rename source/{read-from-mongodb.txt => batch-mode/batch-read.txt} (94%) rename source/{configuration/write.txt => batch-mode/batch-write-config.txt} (100%) create mode 100644 source/batch-mode/batch-write.txt diff --git a/source/batch-mode.txt b/source/batch-mode.txt new file mode 100644 index 00000000..83443fbd --- /dev/null +++ b/source/batch-mode.txt @@ -0,0 +1,12 @@ +========== +Batch Mode +========== + +.. meta:: + :description: Use the {+connector-long+} to read and write batches of data. + +.. toctree:: + :caption: Batch Mode + + /batch-mode/batch-read + /batch-mode/batch-write diff --git a/source/configuration/read.txt b/source/batch-mode/batch-read-config.txt similarity index 99% rename from source/configuration/read.txt rename to source/batch-mode/batch-read-config.txt index 649be7d0..b35ad9f7 100644 --- a/source/configuration/read.txt +++ b/source/batch-mode/batch-read-config.txt @@ -4,8 +4,6 @@ Read Configuration Options ========================== -.. default-domain:: mongodb - .. contents:: On this page :local: :backlinks: none diff --git a/source/read-from-mongodb.txt b/source/batch-mode/batch-read.txt similarity index 94% rename from source/read-from-mongodb.txt rename to source/batch-mode/batch-read.txt index 4fdca2db..4539834d 100644 --- a/source/read-from-mongodb.txt +++ b/source/batch-mode/batch-read.txt @@ -7,7 +7,10 @@ Read from MongoDB ================= -.. default-domain:: mongodb +.. toctree:: + :caption: Read Configuration Options + + /./batch-read-config.txt .. contents:: On this page :local: diff --git a/source/configuration/write.txt b/source/batch-mode/batch-write-config.txt similarity index 100% rename from source/configuration/write.txt rename to source/batch-mode/batch-write-config.txt diff --git a/source/batch-mode/batch-write.txt b/source/batch-mode/batch-write.txt new file mode 100644 index 00000000..e69de29b From 83ebbd1ab951a876d135628977d75ae3e83e6357 Mon Sep 17 00:00:00 2001 From: Mike Woofter Date: Mon, 9 Oct 2023 14:38:40 -0500 Subject: [PATCH 02/65] fix --- source/index.txt | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/source/index.txt b/source/index.txt index 35c24014..5ef12bee 100644 --- a/source/index.txt +++ b/source/index.txt @@ -47,10 +47,8 @@ versions of Apache Spark and MongoDB: .. toctree:: :titlesonly: - configuration getting-started - write-to-mongodb - read-from-mongodb + batch-mode structured-streaming faq release-notes From 79cd1580743d613aa90929278221d62d796b43df Mon Sep 17 00:00:00 2001 From: Mike Woofter Date: Mon, 9 Oct 2023 14:44:44 -0500 Subject: [PATCH 03/65] fix --- source/configuration.txt | 6 ------ source/index.txt | 2 +- 2 files changed, 1 insertion(+), 7 deletions(-) diff --git a/source/configuration.txt b/source/configuration.txt index efe84e90..b4486ae4 100644 --- a/source/configuration.txt +++ b/source/configuration.txt @@ -156,9 +156,3 @@ properly: - :ref:`SparkConf ` - :ref:`Options maps ` - -.. 
toctree:: - :titlesonly: - - configuration/write - configuration/read diff --git a/source/index.txt b/source/index.txt index 5ef12bee..b70db4e2 100644 --- a/source/index.txt +++ b/source/index.txt @@ -48,7 +48,7 @@ versions of Apache Spark and MongoDB: :titlesonly: getting-started - batch-mode + /batch-mode structured-streaming faq release-notes From 7e1df0e181ac1ebab1457365ac5866c368f675b4 Mon Sep 17 00:00:00 2001 From: Mike Woofter Date: Mon, 9 Oct 2023 14:54:38 -0500 Subject: [PATCH 04/65] test --- source/batch-mode/batch-read.txt | 2 +- source/batch-mode/batch-write.txt | 49 +++++++++++++++++++++++++++++++ source/write-to-mongodb.txt | 49 ------------------------------- 3 files changed, 50 insertions(+), 50 deletions(-) delete mode 100644 source/write-to-mongodb.txt diff --git a/source/batch-mode/batch-read.txt b/source/batch-mode/batch-read.txt index 4539834d..e08918cb 100644 --- a/source/batch-mode/batch-read.txt +++ b/source/batch-mode/batch-read.txt @@ -10,7 +10,7 @@ Read from MongoDB .. toctree:: :caption: Read Configuration Options - /./batch-read-config.txt + /batch-mode/batch-read-config .. contents:: On this page :local: diff --git a/source/batch-mode/batch-write.txt b/source/batch-mode/batch-write.txt index e69de29b..31f44197 100644 --- a/source/batch-mode/batch-write.txt +++ b/source/batch-mode/batch-write.txt @@ -0,0 +1,49 @@ +.. _write-to-mongodb: +.. _scala-write: +.. _java-write: + +================ +Write to MongoDB +================ + +.. default-domain:: mongodb + +.. tabs-selector:: drivers + +.. tabs-drivers:: + + tabs: + - id: java-sync + content: | + + .. include:: /java/write-to-mongodb.txt + + - id: python + content: | + + .. include:: /python/write-to-mongodb.txt + + - id: scala + content: | + + .. include:: /scala/write-to-mongodb.txt + +.. warning:: Setting the Write Mode to ``overwrite`` + + If you specify the ``overwrite`` write mode, the connector drops the target + collection and creates a new collection that uses the + default collection options. + This behavior can affect collections that don't use the default options, + such as the following collection types: + + - Sharded collections + - Collections with non-default collations + - Time-series collections + +.. important:: + + If your write operation includes a field with a ``null`` value, + the connector writes the field name and ``null`` value to MongoDB. You can + change this behavior by setting the write configuration property + ``ignoreNullValues``. For more information about setting the connector's + write behavior, see :ref:`Write Configuration Options `. diff --git a/source/write-to-mongodb.txt b/source/write-to-mongodb.txt deleted file mode 100644 index 31f44197..00000000 --- a/source/write-to-mongodb.txt +++ /dev/null @@ -1,49 +0,0 @@ -.. _write-to-mongodb: -.. _scala-write: -.. _java-write: - -================ -Write to MongoDB -================ - -.. default-domain:: mongodb - -.. tabs-selector:: drivers - -.. tabs-drivers:: - - tabs: - - id: java-sync - content: | - - .. include:: /java/write-to-mongodb.txt - - - id: python - content: | - - .. include:: /python/write-to-mongodb.txt - - - id: scala - content: | - - .. include:: /scala/write-to-mongodb.txt - -.. warning:: Setting the Write Mode to ``overwrite`` - - If you specify the ``overwrite`` write mode, the connector drops the target - collection and creates a new collection that uses the - default collection options. 
- This behavior can affect collections that don't use the default options, - such as the following collection types: - - - Sharded collections - - Collections with non-default collations - - Time-series collections - -.. important:: - - If your write operation includes a field with a ``null`` value, - the connector writes the field name and ``null`` value to MongoDB. You can - change this behavior by setting the write configuration property - ``ignoreNullValues``. For more information about setting the connector's - write behavior, see :ref:`Write Configuration Options `. From b20a31abe209760b102f1c10214f44077e6d0e95 Mon Sep 17 00:00:00 2001 From: Mike Woofter Date: Mon, 9 Oct 2023 15:04:45 -0500 Subject: [PATCH 05/65] add streaming --- source/batch-mode/batch-write.txt | 5 +- source/streaming-mode.txt | 12 + .../streaming-mode/streaming-read-config.txt | 421 ++++++++++++++++++ source/streaming-mode/streaming-read.txt | 79 ++++ .../streaming-mode/streaming-write-config.txt | 203 +++++++++ source/streaming-mode/streaming-write.txt | 52 +++ 6 files changed, 771 insertions(+), 1 deletion(-) create mode 100644 source/streaming-mode.txt create mode 100644 source/streaming-mode/streaming-read-config.txt create mode 100644 source/streaming-mode/streaming-read.txt create mode 100644 source/streaming-mode/streaming-write-config.txt create mode 100644 source/streaming-mode/streaming-write.txt diff --git a/source/batch-mode/batch-write.txt b/source/batch-mode/batch-write.txt index 31f44197..5b074001 100644 --- a/source/batch-mode/batch-write.txt +++ b/source/batch-mode/batch-write.txt @@ -6,7 +6,10 @@ Write to MongoDB ================ -.. default-domain:: mongodb +.. toctree:: + :caption: Read Configuration Options + + /batch-mode/batch-write-config .. tabs-selector:: drivers diff --git a/source/streaming-mode.txt b/source/streaming-mode.txt new file mode 100644 index 00000000..931cc197 --- /dev/null +++ b/source/streaming-mode.txt @@ -0,0 +1,12 @@ +============== +Streaming Mode +============== + +.. meta:: + :description: Use the {+connector-long+} to stream data. + +.. toctree:: + :caption: Streaming Mode + + /streaming-mode/streaming-read + /streaming-mode/streaming-write diff --git a/source/streaming-mode/streaming-read-config.txt b/source/streaming-mode/streaming-read-config.txt new file mode 100644 index 00000000..cf99d709 --- /dev/null +++ b/source/streaming-mode/streaming-read-config.txt @@ -0,0 +1,421 @@ +.. _spark-streaming-read-conf: + +========================== +Read Configuration Options +========================== + +.. contents:: On this page + :local: + :backlinks: none + :depth: 1 + :class: singlecol + +.. _spark-streaming-input-conf: + +Read Configuration +------------------ + +You can configure the following properties to read from MongoDB: + +.. note:: + + If you use ``SparkConf`` to set the connector's read configurations, + prefix ``spark.mongodb.read.`` to each property. + +.. list-table:: + :header-rows: 1 + :widths: 35 65 + + * - Property name + - Description + + * - ``connection.uri`` + - | **Required.** + | The connection string configuration key. + | + | **Default:** ``mongodb://localhost:27017/`` + + * - ``database`` + - | **Required.** + | The database name configuration. + + * - ``collection`` + - | **Required.** + | The collection name configuration. + + * - ``comment`` + - | The comment to append to the read operation. Comments appear in the + :manual:`output of the Database Profiler. 
` + | + | **Default:** None + + * - ``mongoClientFactory`` + - | MongoClientFactory configuration key. + | You can specify a custom implementation which must implement the + ``com.mongodb.spark.sql.connector.connection.MongoClientFactory`` + interface. + | + | **Default:** ``com.mongodb.spark.sql.connector.connection.DefaultMongoClientFactory`` + + * - ``partitioner`` + - | The partitioner full class name. + + | You can specify a custom implementation which must implement the + ``com.mongodb.spark.sql.connector.read.partitioner.Partitioner`` + interface. + | See the + :ref:`Partitioner Configuration ` section for more + information on partitioners. + | + | **Default:** ``com.mongodb.spark.sql.connector.read.partitioner.SamplePartitioner`` + + * - ``partitioner.options.`` + - | Partitioner configuration prefix. + | See the + :ref:`Partitioner Configuration ` section for more + information on partitioners. + + * - ``sampleSize`` + - | The number of documents to sample from the collection when inferring + | the schema. + | + | **Default:** ``1000`` + + * - ``sql.inferSchema.mapTypes.enabled`` + - | Whether to enable Map types when inferring the schema. + | When enabled, large compatible struct types are inferred to a + ``MapType`` instead. + | + | **Default:** ``true`` + + * - ``sql.inferSchema.mapTypes.minimum.key.size`` + - | Minimum size of a ``StructType`` before inferring as a ``MapType``. + | + | **Default:** ``250`` + + * - ``aggregation.pipeline`` + - | Specifies a custom aggregation pipeline to apply to the collection + before sending data to Spark. + | The value must be either an extended JSON single document or list + of documents. + | A single document should resemble the following: + + .. code-block:: json + + {"$match": {"closed": false}} + + | A list of documents should resemble the following: + + .. code-block:: json + + [{"$match": {"closed": false}}, {"$project": {"status": 1, "name": 1, "description": 1}}] + + .. important:: + + Custom aggregation pipelines must be compatible with the + partitioner strategy. For example, aggregation stages such as + ``$group`` do not work with any partitioner that creates more than + one partition. + + * - ``aggregation.allowDiskUse`` + - | Specifies whether to allow storage to disk when running the + aggregation. + | + | **Default:** ``true`` + + * - ``outputExtendedJson`` + - | When ``true``, the connector converts BSON types not supported by Spark into + extended JSON strings. + When ``false``, the connector uses the original relaxed JSON format for + unsupported types. + | + | **Default:** ``false`` + +.. _partitioner-conf: + +Partitioner Configurations +~~~~~~~~~~~~~~~~~~~~~~~~~~ + +Partitioners change the read behavior for batch reads with the {+connector-short+}. +They do not affect Structured Streaming because the data stream processing +engine produces a single stream with Structured Streaming. + +This section contains configuration information for the following +partitioners: + +- :ref:`SamplePartitioner ` +- :ref:`ShardedPartitioner ` +- :ref:`PaginateBySizePartitioner ` +- :ref:`PaginateIntoPartitionsPartitioner ` +- :ref:`SinglePartitionPartitioner ` + +.. _conf-mongosamplepartitioner: +.. _conf-samplepartitioner: + +``SamplePartitioner`` Configuration +``````````````````````````````````` + +.. include:: /includes/sparkconf-partitioner-options-note.rst + +You must specify this partitioner using the full classname: +``com.mongodb.spark.sql.connector.read.partitioner.SamplePartitioner``. + + +.. 
list-table:: + :header-rows: 1 + :widths: 35 65 + + * - Property name + - Description + + * - ``partitioner.options.partition.field`` + - The field to use for partitioning, which must be a unique field. + + **Default:** ``_id`` + + * - ``partitioner.options.partition.size`` + - The size (in MB) for each partition. Smaller partition sizes + create more partitions containing fewer documents. + + **Default:** ``64`` + + + * - ``partitioner.options.samples.per.partition`` + - The number of samples to take per partition. The total number of + samples taken is: + + .. code-block:: none + + samples per partition * ( count / number of documents per partition) + + **Default:** ``10`` + +.. example:: + + For a collection with 640 documents with an average document + size of 0.5 MB, the default SamplePartitioner configuration values creates + 5 partitions with 128 documents per partition. + + The MongoDB Spark Connector samples 50 documents (the default 10 + per intended partition) and defines 5 partitions by selecting + partition field ranges from the sampled documents. + +.. _conf-mongoshardedpartitioner: +.. _conf-shardedpartitioner: + +``ShardedPartitioner`` Configuration +````````````````````````````````````` + +The ``ShardedPartitioner`` automatically determines the partitions to use +based on your shard configuration. + +You must specify this partitioner using the full classname: +``com.mongodb.spark.sql.connector.read.partitioner.ShardedPartitioner``. + +.. warning:: + + This partitioner is not compatible with hashed shard keys. + + +.. _conf-mongopaginatebysizepartitioner: +.. _conf-paginatebysizepartitioner: + +``PaginateBySizePartitioner`` Configuration +``````````````````````````````````````````` + +.. include:: /includes/sparkconf-partitioner-options-note.rst + +You must specify this partitioner using the full classname: +``com.mongodb.spark.sql.connector.read.partitioner.PaginateBySizePartitioner``. + +.. list-table:: + :header-rows: 1 + :widths: 35 65 + + * - Property name + - Description + + * - ``partitioner.options.partition.field`` + - The field to use for partitioning, which must be a unique field. + + **Default:** ``_id`` + + * - ``partitioner.options.partition.size`` + - The size (in MB) for each partition. Smaller partition sizes + + create more partitions containing fewer documents. + + **Default:** ``64`` + +.. _conf-paginateintopartitionspartitioner: + +``PaginateIntoPartitionsPartitioner`` Configuration +``````````````````````````````````````````````````` + +.. include:: /includes/sparkconf-partitioner-options-note.rst + +You must specify this partitioner using the full classname: +``com.mongodb.spark.sql.connector.read.partitioner.PaginateIntoPartitionsPartitioner``. + + +.. list-table:: + :header-rows: 1 + :widths: 35 65 + + * - Property name + - Description + + * - ``partitioner.options.partition.field`` + - The field to use for partitioning, which must be a unique field. + + **Default:** ``_id`` + + * - ``partitioner.options.maxNumberOfPartitions`` + - The number of partitions to create. + + **Default:** ``64`` + +.. _conf-singlepartitionpartitioner: + +``SinglePartitionPartitioner`` Configuration +```````````````````````````````````````````` + +.. include:: /includes/sparkconf-partitioner-options-note.rst + +You must specify this partitioner using the full classname: +``com.mongodb.spark.sql.connector.read.partitioner.SinglePartitionPartitioner``. + +This partitioner creates a single partition. + +.. _spark-change-stream-conf: + +Change Streams +-------------- + +.. 
note:: + + If you use ``SparkConf`` to set the connector's change stream + configurations, prefix ``spark.mongodb.`` to each property. + +.. list-table:: + :header-rows: 1 + :widths: 35 65 + + * - Property name + - Description + + * - ``change.stream.lookup.full.document`` + + - Determines what values your change stream returns on update + operations. + + The default setting returns the differences between the original + document and the updated document. + + The ``updateLookup`` setting returns the differences between the + original document and updated document as well as a copy of the + entire updated document. + + **Default:** "default" + + .. tip:: + + For more information on how this change stream option works, + see the MongoDB server manual guide + :manual:`Lookup Full Document for Update Operation `. + + * - ``change.stream.micro.batch.max.partition.count`` + - | The maximum number of partitions the {+connector-short+} divides each + micro-batch into. Spark workers can process these partitions in parallel. + | + | This setting applies only when using micro-batch streams. + | + | **Default**: ``1`` + + .. warning:: Event Order + + Specifying a value larger than ``1`` can alter the order in which + the {+connector-short+} processes change events. Avoid this setting + if out-of-order processing could create data inconsistencies downstream. + + * - ``change.stream.publish.full.document.only`` + - | Specifies whether to publish the changed document or the full + change stream document. + | + | When this setting is ``true``, the connector exhibits the following behavior: + + - The connector filters out messages that + omit the ``fullDocument`` field and only publishes the value of the + field. + - If you don't specify a schema, the connector infers the schema + from the change stream document rather than from the underlying collection. + + **Default**: ``false`` + + .. note:: + + This setting overrides the ``change.stream.lookup.full.document`` + setting. + + * - ``change.stream.startup.mode`` + - | Specifies how the connector starts up when no offset is available. + + | This setting accepts the following values: + + - ``latest``: The connector begins processing + change events starting with the most recent event. + It will not process any earlier unprocessed events. + - ``timestamp``: The connector begins processing change events at a specified time. + + To use the ``timestamp`` option, you must specify a time by using the + ``change.stream.startup.mode.timestamp.start.at.operation.time`` setting. + This setting accepts timestamps in the following formats: + + - An integer representing the number of seconds since the + :wikipedia:`Unix epoch ` + - A date and time in + `ISO-8601 `__ + format with one-second precision + - An extended JSON ``BsonTimestamp`` + + **Default**: ``latest`` + +.. _configure-input-uri: + +``connection.uri`` Configuration Setting +---------------------------------------- + +You can set all :ref:`spark-input-conf` via the read ``connection.uri`` setting. + +For example, consider the following example which sets the read +``connection.uri`` setting: + +.. note:: + + If you use ``SparkConf`` to set the connector's read configurations, + prefix ``spark.mongodb.read.`` to the setting. + +.. code:: cfg + + spark.mongodb.read.connection.uri=mongodb://127.0.0.1/databaseName.collectionName?readPreference=primaryPreferred + + +The configuration corresponds to the following separate configuration +settings: + +.. 
code:: cfg + + spark.mongodb.read.connection.uri=mongodb://127.0.0.1/ + spark.mongodb.read.database=databaseName + spark.mongodb.read.collection=collectionName + spark.mongodb.read.readPreference.name=primaryPreferred + +If you specify a setting both in the ``connection.uri`` and in a separate +configuration, the ``connection.uri`` setting overrides the separate +setting. For example, given the following configuration, the +database for the connection is ``foobar``: + +.. code:: cfg + + spark.mongodb.read.connection.uri=mongodb://127.0.0.1/foobar + spark.mongodb.read.database=bar diff --git a/source/streaming-mode/streaming-read.txt b/source/streaming-mode/streaming-read.txt new file mode 100644 index 00000000..f5d2d992 --- /dev/null +++ b/source/streaming-mode/streaming-read.txt @@ -0,0 +1,79 @@ +.. _read-from-mongodb: +.. _scala-read: +.. _java-read: +.. _scala-dataset-filters: + +================= +Read from MongoDB +================= + +.. toctree:: + :caption: Read Configuration Options + + /streaming-mode/streaming-read-config + +.. contents:: On this page + :local: + :backlinks: none + :depth: 1 + :class: singlecol + +Overview +-------- + +.. tabs-selector:: drivers + +.. tabs-drivers:: + + tabs: + - id: java-sync + content: | + + .. include:: /java/read-from-mongodb.txt + + - id: python + content: | + + .. include:: /python/read-from-mongodb.txt + + .. include:: /python/filters.txt + + - id: scala + content: | + + .. include:: /scala/read-from-mongodb.txt + + .. include:: /scala/filters.txt + +.. important:: Inferring the Schema of a Change Stream + + When the {+connector-short+} infers the schema of a data frame + read from a change stream, by default, + it will use the schema of the underlying collection rather than that + of the change stream. If you set the ``change.stream.publish.full.document.only`` + option to ``true``, the connector uses the schema of the + change stream instead. + + For more information on configuring a read operation, see the + :ref:`spark-change-stream-conf` section of the Read Configuration Options guide. + +SQL Queries +----------- + +.. tabs-drivers:: + + tabs: + - id: java-sync + content: | + + .. include:: /java/sql.txt + + - id: python + content: | + + .. include:: /python/sql.txt + + - id: scala + content: | + + .. include:: /scala/sql.txt diff --git a/source/streaming-mode/streaming-write-config.txt b/source/streaming-mode/streaming-write-config.txt new file mode 100644 index 00000000..ce4404ce --- /dev/null +++ b/source/streaming-mode/streaming-write-config.txt @@ -0,0 +1,203 @@ +.. _spark-write-conf: + +=========================== +Write Configuration Options +=========================== + +.. contents:: On this page + :local: + :backlinks: none + :depth: 1 + :class: singlecol + +.. _spark-output-conf: + +Write Configuration +------------------- + +The following options for writing to MongoDB are available: + +.. note:: + + If you use ``SparkConf`` to set the connector's write configurations, + prefix ``spark.mongodb.write.`` to each property. + +.. list-table:: + :header-rows: 1 + :widths: 35 65 + + * - Property name + - Description + + * - ``connection.uri`` + - | **Required.** + | The connection string configuration key. + | + | **Default:** ``mongodb://localhost:27017/`` + + * - ``database`` + - | **Required.** + | The database name configuration. + + * - ``collection`` + - | **Required.** + | The collection name configuration. + + * - ``comment`` + - | The comment to append to the write operation. 
Comments appear in the + :manual:`output of the Database Profiler. ` + | + | **Default:** None + + * - ``convertJson`` + - | Specifies whether the connector parses the string and converts extended JSON + into BSON. + | + | This setting accepts the following values: + + - ``any``: The connector converts all JSON values to BSON. + + - ``"{a: 1}"`` becomes ``{a: 1}``. + - ``"[1, 2, 3]"`` becomes ``[1, 2, 3]``. + - ``"true"`` becomes ``true``. + - ``"01234"`` becomes ``1234``. + - ``"{a:b:c}"`` doesn't change. + + - ``objectOrArrayOnly``: The connector converts only JSON objects and arrays to + BSON. + + - ``"{a: 1}"`` becomes ``{a: 1}``. + - ``"[1, 2, 3]"`` becomes ``[1, 2, 3]``. + - ``"true"`` doesn't change. + - ``"01234"`` doesn't change. + - ``"{a:b:c}"`` doesn't change. + + - ``false``: The connector leaves all values as strings. + + | **Default:** ``false`` + + * - ``idFieldList`` + - | Field or list of fields by which to split the collection data. To + specify more than one field, separate them using a comma as shown + in the following example: + + .. code-block:: none + :copyable: false + + "fieldName1,fieldName2" + + | **Default:** ``_id`` + + * - ``ignoreNullValues`` + - | When ``true``, the connector ignores any ``null`` values when writing, + including ``null`` values in arrays and nested documents. + | + | **Default:** ``false`` + + * - ``maxBatchSize`` + - | Specifies the maximum number of operations to batch in bulk + operations. + | + | **Default:** ``512`` + + * - ``mongoClientFactory`` + - | MongoClientFactory configuration key. + | You can specify a custom implementation which must implement the + ``com.mongodb.spark.sql.connector.connection.MongoClientFactory`` + interface. + | + | **Default:** ``com.mongodb.spark.sql.connector.connection.DefaultMongoClientFactory`` + + * - ``operationType`` + - | Specifies the type of write operation to perform. You can set + this to one of the following values: + + - ``insert``: Insert the data. + - ``replace``: Replace an existing document that matches the + ``idFieldList`` value with the new data. If no match exists, the + value of ``upsertDocument`` indicates whether the connector + inserts a new document. + - ``update``: Update an existing document that matches the + ``idFieldList`` value with the new data. If no match exists, the + value of ``upsertDocument`` indicates whether the connector + inserts a new document. + + | + | **Default:** ``replace`` + + * - ``ordered`` + - | Specifies whether to perform ordered bulk operations. + | + | **Default:** ``true`` + + * - ``upsertDocument`` + - | When ``true``, replace and update operations will insert the data + if no match exists. + | + | For time series collections, you must set ``upsertDocument`` to + ``false``. + | + | **Default:** ``true`` + + * - ``writeConcern.journal`` + - | Specifies ``j``, a write-concern option to enable request for + acknowledgment that the data is confirmed on on-disk journal for + the criteria specified in the ``w`` option. You can specify + either ``true`` or ``false``. + | + | For more information on ``j`` values, see the MongoDB server + guide on the + :manual:`WriteConcern j option `. + + * - ``writeConcern.w`` + - | Specifies ``w``, a write-concern option to request acknowledgment + that the write operation has propagated to a specified number of + MongoDB nodes. For a list + of allowed values for this option, see :manual:`WriteConcern + ` in the MongoDB manual. 
+ | + | **Default:** ``1`` + + * - ``writeConcern.wTimeoutMS`` + - | Specifies ``wTimeoutMS``, a write-concern option to return an error + when a write operation exceeds the number of milliseconds. If you + use this optional setting, you must specify a nonnegative integer. + | + | For more information on ``wTimeoutMS`` values, see the MongoDB server + guide on the + :manual:`WriteConcern wtimeout option `. + +.. _configure-output-uri: + +``connection.uri`` Configuration Setting +---------------------------------------- + +You can set all :ref:`spark-output-conf` via the write ``connection.uri``. + +.. note:: + + If you use ``SparkConf`` to set the connector's write configurations, + prefix ``spark.mongodb.write.`` to the setting. + +.. code:: cfg + + spark.mongodb.write.connection.uri=mongodb://127.0.0.1/test.myCollection + +The configuration corresponds to the following separate configuration +settings: + +.. code:: cfg + + spark.mongodb.write.connection.uri=mongodb://127.0.0.1/ + spark.mongodb.write.database=test + spark.mongodb.write.collection=myCollection + +If you specify a setting both in the ``connection.uri`` and in a separate +configuration, the ``connection.uri`` setting overrides the separate +setting. For example, in the following configuration, the +database for the connection is ``foobar``: + +.. code:: cfg + + spark.mongodb.write.connection.uri=mongodb://127.0.0.1/foobar + spark.mongodb.write.database=bar diff --git a/source/streaming-mode/streaming-write.txt b/source/streaming-mode/streaming-write.txt new file mode 100644 index 00000000..b44aee73 --- /dev/null +++ b/source/streaming-mode/streaming-write.txt @@ -0,0 +1,52 @@ +.. _write-to-mongodb: +.. _scala-write: +.. _java-write: + +================ +Write to MongoDB +================ + +.. toctree:: + :caption: Read Configuration Options + + /streaming-mode/streaming-write-config + +.. tabs-selector:: drivers + +.. tabs-drivers:: + + tabs: + - id: java-sync + content: | + + .. include:: /java/write-to-mongodb.txt + + - id: python + content: | + + .. include:: /python/write-to-mongodb.txt + + - id: scala + content: | + + .. include:: /scala/write-to-mongodb.txt + +.. warning:: Setting the Write Mode to ``overwrite`` + + If you specify the ``overwrite`` write mode, the connector drops the target + collection and creates a new collection that uses the + default collection options. + This behavior can affect collections that don't use the default options, + such as the following collection types: + + - Sharded collections + - Collections with non-default collations + - Time-series collections + +.. important:: + + If your write operation includes a field with a ``null`` value, + the connector writes the field name and ``null`` value to MongoDB. You can + change this behavior by setting the write configuration property + ``ignoreNullValues``. For more information about setting the connector's + write behavior, see :ref:`Write Configuration Options `. 
From d7292d7123d623152615e4bdd8081572aa4b0be9 Mon Sep 17 00:00:00 2001 From: Mike Woofter Date: Tue, 10 Oct 2023 16:53:44 -0500 Subject: [PATCH 06/65] cache config --- source/configuration.txt | 38 ++++++++------------------------------ source/faq.txt | 29 +++++++++++++++++++++++++---- source/index.txt | 1 + 3 files changed, 34 insertions(+), 34 deletions(-) diff --git a/source/configuration.txt b/source/configuration.txt index b4486ae4..9442acee 100644 --- a/source/configuration.txt +++ b/source/configuration.txt @@ -1,8 +1,8 @@ -===================== -Configuration Options -===================== +.. _configuration: -.. default-domain:: mongodb +================= +Configuring Spark +================= .. contents:: On this page :local: @@ -118,34 +118,12 @@ specifying an option key string. Using a System Property ~~~~~~~~~~~~~~~~~~~~~~~ -The connector provides a cache for ``MongoClients`` which can only be -configured with a System Property. See :ref:`cache-configuration`. +The {+connector-short+} reads some configuration settings before ``SparkConf`` is +available. You must specify these settings by using a JVM system property. -.. _cache-configuration: +.. tip:: System Properties -Cache Configuration -------------------- - -The MongoConnector includes a cache for MongoClients, so workers can -share the MongoClient across threads. - -.. important:: - - As the cache is setup before the Spark Configuration is available, - the cache can only be configured with a System Property. - -.. list-table:: - :header-rows: 1 - :widths: 35 65 - - * - System Property name - - Description - - * - ``mongodb.keep_alive_ms`` - - The length of time to keep a ``MongoClient`` available for - sharing. - - **Default:** ``5000`` + For more information on Java system properties, see the `Java documentation. `__ ``ConfigException``\s --------------------- diff --git a/source/faq.txt b/source/faq.txt index 6fefa7a4..d3d3c270 100644 --- a/source/faq.txt +++ b/source/faq.txt @@ -49,7 +49,28 @@ To use mTLS, include the following options when you run ``spark-submit``: --driver-java-options -Djavax.net.ssl.trustStorePassword= \ --driver-java-options -Djavax.net.ssl.keyStore= \ --driver-java-options -Djavax.net.ssl.keyStorePassword= \ - -conf spark.executor.extraJavaOptions=-Djavax.net.ssl.trustStore= \ - -conf spark.executor.extraJavaOptions=-Djavax.net.ssl.trustStorePassword= \ - -conf spark.executor.extraJavaOptions=-Djavax.net.ssl.keyStore= \ - -conf spark.executor.extraJavaOptions=-Djavax.net.ssl.keyStorePassword= \ \ No newline at end of file + --conf spark.executor.extraJavaOptions=-Djavax.net.ssl.trustStore= \ + --conf spark.executor.extraJavaOptions=-Djavax.net.ssl.trustStorePassword= \ + --conf spark.executor.extraJavaOptions=-Djavax.net.ssl.keyStore= \ + --conf spark.executor.extraJavaOptions=-Djavax.net.ssl.keyStorePassword= \ + +.. _cache-configuration: + +How can I share a MongoClient instance across threads? +------------------------------------------------------ + +The MongoConnector includes a cache that lets workers +share a single ``MongoClient`` across threads. To specify the length of time to keep a +``MongoClient`` available, include the ``mongodb.keep_alive_ms`` option when you run +``spark-submit``: + +.. code-block:: bash + + --driver-java-options -Dmongodb.keep_alive_ms= + +By default, this property has a value of ``5000``. + +.. note:: + + Because the cache is set up before the Spark Configuration is available, + you must use a system property to configure it. 
\ No newline at end of file diff --git a/source/index.txt b/source/index.txt index b70db4e2..1880e87a 100644 --- a/source/index.txt +++ b/source/index.txt @@ -48,6 +48,7 @@ versions of Apache Spark and MongoDB: :titlesonly: getting-started + configuration /batch-mode structured-streaming faq From 4a4f5813b1487845c779feabc7d95e66120f096f Mon Sep 17 00:00:00 2001 From: Mike Woofter Date: Tue, 10 Oct 2023 16:55:53 -0500 Subject: [PATCH 07/65] remove configexception --- source/configuration.txt | 12 +----------- 1 file changed, 1 insertion(+), 11 deletions(-) diff --git a/source/configuration.txt b/source/configuration.txt index 9442acee..8ecf00fb 100644 --- a/source/configuration.txt +++ b/source/configuration.txt @@ -123,14 +123,4 @@ available. You must specify these settings by using a JVM system property. .. tip:: System Properties - For more information on Java system properties, see the `Java documentation. `__ - -``ConfigException``\s ---------------------- - -A configuration error throws a ``ConfigException``. Confirm that any of -the following methods of configuration that you use are configured -properly: - -- :ref:`SparkConf ` -- :ref:`Options maps ` + For more information on Java system properties, see the `Java documentation. `__ \ No newline at end of file From 2c921baec74df6e5134e15a7d533464634dae0f1 Mon Sep 17 00:00:00 2001 From: Mike Woofter Date: Tue, 10 Oct 2023 16:59:04 -0500 Subject: [PATCH 08/65] add streaming to index --- source/index.txt | 1 + 1 file changed, 1 insertion(+) diff --git a/source/index.txt b/source/index.txt index 1880e87a..f8e6c808 100644 --- a/source/index.txt +++ b/source/index.txt @@ -50,6 +50,7 @@ versions of Apache Spark and MongoDB: getting-started configuration /batch-mode + /streaming-mode structured-streaming faq release-notes From 7332e54f3a4f7b8bf68aa798b23f3c117419672a Mon Sep 17 00:00:00 2001 From: Mike Woofter Date: Tue, 10 Oct 2023 17:09:47 -0500 Subject: [PATCH 09/65] streaming mode --- source/streaming-mode.txt | 17 + source/streaming-mode/streaming-read.txt | 394 ++++++++++- source/streaming-mode/streaming-write.txt | 325 +++++++++- source/structured-streaming.txt | 755 ---------------------- 4 files changed, 694 insertions(+), 797 deletions(-) delete mode 100644 source/structured-streaming.txt diff --git a/source/streaming-mode.txt b/source/streaming-mode.txt index 931cc197..b0973255 100644 --- a/source/streaming-mode.txt +++ b/source/streaming-mode.txt @@ -2,6 +2,12 @@ Streaming Mode ============== +.. contents:: On this page + :local: + :backlinks: none + :depth: 2 + :class: singlecol + .. meta:: :description: Use the {+connector-long+} to stream data. @@ -10,3 +16,14 @@ Streaming Mode /streaming-mode/streaming-read /streaming-mode/streaming-write + +Spark Structured Streaming is a data stream processing engine you can +use through the Dataset or DataFrame API. The MongoDB Spark Connector +enables you to stream to and from MongoDB using Spark Structured +Streaming. + +.. include:: includes/streaming-distinction.rst + +To learn more about Structured Streaming, see the +`Spark Programming Guide +`__. diff --git a/source/streaming-mode/streaming-read.txt b/source/streaming-mode/streaming-read.txt index f5d2d992..e9f43358 100644 --- a/source/streaming-mode/streaming-read.txt +++ b/source/streaming-mode/streaming-read.txt @@ -2,6 +2,12 @@ .. _scala-read: .. _java-read: .. _scala-dataset-filters: +.. _streaming-read-from-mongodb: +.. _streaming-scala-read: +.. _streaming-java-read: +.. _streaming-scala-dataset-filters: +.. 
_read-structured-stream: +.. _continuous-processing: ================= Read from MongoDB @@ -21,59 +27,407 @@ Read from MongoDB Overview -------- -.. tabs-selector:: drivers +When reading a stream from a MongoDB database, the {+connector-long+} supports both +*micro-batch processing* and +*continuous processing*. Micro-batch processing is the default processing engine, while +continuous processing is an experimental feature introduced in +Spark version 2.3. To learn +more about continuous processing, see the `Spark documentation `__. + +.. include:: /includes/fact-read-from-change-stream + +.. note:: + + Since Structured Streaming produces a single partition, it ignores + :ref:`partitioner configurations `. Partitioner + configuration only apply when there are multiple partitions. This is true + for both micro-batch processing and continuous processing streams. .. tabs-drivers:: tabs: + - id: java-sync content: | - .. include:: /java/read-from-mongodb.txt + To read data from MongoDB, specify the following read-stream configuration settings on + `DataStreamReader `__: + + .. list-table:: + :header-rows: 1 + :stub-columns: 1 + :widths: 10 40 + + * - Setting + - Description + + * - ``readStream.format()`` + - The format to use for read stream data. Use ``mongodb``. + + * - ``writeStream.trigger()`` + - Specifies how often results should be + written to the streaming sink. + + To use continuous processing, pass ``Trigger.Continuous(