Commit a399cce

Merge pull request #113 from marklogic/feature/docs-update
Updating docs for 2.1.0
2 parents c545b58 + c7e55d5

File tree

9 files changed: +17, -10 lines

docs/getting-started/jupyter.md

Lines changed: 2 additions & 2 deletions
@@ -32,15 +32,15 @@ connector and also to initialize Spark:

 ```
 import os
-os.environ['PYSPARK_SUBMIT_ARGS'] = '--jars "/path/to/marklogic-spark-connector-2.0.0.jar" pyspark-shell'
+os.environ['PYSPARK_SUBMIT_ARGS'] = '--jars "/path/to/marklogic-spark-connector-2.1.0.jar" pyspark-shell'

 from pyspark.sql import SparkSession
 spark = SparkSession.builder.master("local[*]").appName('My Notebook').getOrCreate()
 spark.sparkContext.setLogLevel("WARN")
 spark
 ```

-The path of `/path/to/marklogic-spark-connector-2.0.0.jar` should be changed to match the location of the connector
+The path of `/path/to/marklogic-spark-connector-2.1.0.jar` should be changed to match the location of the connector
 jar on your filesystem. You are free to customize the `spark` variable in any manner you see fit as well.

 Now that you have an initialized Spark session, you can run any of the examples found in the
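With the session from the snippet above initialized, reading rows typically follows the connector's `format("marklogic")` pattern. The sketch below only assembles the option map; the connection URI and the Optic view names are illustrative assumptions, not values from this commit, and the actual read call is left commented out because it needs a running MarkLogic instance:

```python
# Illustrative only: the connection URI and the Optic view are assumed values.
options = {
    "spark.marklogic.client.uri": "spark-example-user:password@localhost:8003",
    "spark.marklogic.read.opticQuery": "op.fromView('example', 'employee')",
}

# With a MarkLogic server available and the connector jar loaded as above:
# df = spark.read.format("marklogic").options(**options).load()
# df.show()
```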

docs/getting-started/pyspark.md

Lines changed: 1 addition & 1 deletion
@@ -29,7 +29,7 @@ shell by pressing `ctrl-D`.

 Run PySpark from the directory that you downloaded the connector to per the [setup instructions](setup.md):

-pyspark --jars marklogic-spark-connector-2.0.0.jar
+pyspark --jars marklogic-spark-connector-2.1.0.jar

 The `--jars` command line option is PySpark's method for utilizing Spark connectors. Each Spark environment should have
 a similar mechanism for including third party connectors; please see the documentation for your particular Spark

docs/reading.md

Lines changed: 4 additions & 0 deletions
@@ -284,6 +284,10 @@ useful when you need to retrieve data that cannot be easily accessed via Optic,
 to that of [MarkLogic's CoRB tool](https://github.com/marklogic-community/corb2) for processing data already in
 MarkLogic.

+When using this feature, please ensure that your MarkLogic user has the required privileges for the
+MarkLogic REST [eval endpoint](https://docs.marklogic.com/REST/POST/v1/eval) and
+[invoke endpoint](https://docs.marklogic.com/REST/POST/v1/invoke).
+
 Custom code can be [written in JavaScript](https://docs.marklogic.com/guide/getting-started/javascript) by
 configuring the `spark.marklogic.read.javascript` option:
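The privilege note in this hunk matters because the connector submits custom code through those REST endpoints. As a hedged sketch (the connection URI and collection name are assumptions, not values from this commit), a custom-JavaScript read might be configured like this:

```python
# Assumed values throughout; the user in the URI needs eval/invoke privileges.
read_options = {
    "spark.marklogic.client.uri": "spark-example-user:password@localhost:8003",
    # Return one URI per row from an assumed 'employee' collection.
    "spark.marklogic.read.javascript":
        "cts.uris(null, null, cts.collectionQuery('employee'))",
}

# With a live MarkLogic instance:
# df = spark.read.format("marklogic").options(**read_options).load()
```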

docs/writing.md

Lines changed: 4 additions & 0 deletions
@@ -189,6 +189,10 @@ To easily support that use case, the connector defaults to assuming that each ro
 column named "URI" of type string. This matches the convention for reading rows via custom code, which defaults to the
 same schema. User-defined custom code is then expected to declare an external variable named "URI".

+When using this feature, please ensure that your MarkLogic user has the required privileges for the
+MarkLogic REST [eval endpoint](https://docs.marklogic.com/REST/POST/v1/eval) and
+[invoke endpoint](https://docs.marklogic.com/REST/POST/v1/invoke).
+
 The following shows an example of reading and processing rows via custom code specified by
 `spark.marklogic.write.javascript`, where each row is expected to have a single column named "URI" (the script for
 reading rows only returns the first 10 URIs to make it easier to verify that the correct data is logged; you can
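Following the default schema this hunk describes (a single string column named "URI"), a hedged sketch of processing rows with custom write code could look like the following; the connection URI and the logging script are assumptions for illustration only:

```python
# Assumed values; per the convention described above, the custom code
# receives each row's value in an external variable named URI.
write_options = {
    "spark.marklogic.client.uri": "spark-example-user:password@localhost:8003",
    "spark.marklogic.write.javascript": "console.log('Processing URI: ' + URI);",
}

# With a live MarkLogic instance and a DataFrame df of URI rows:
# df.write.format("marklogic").options(**write_options).mode("append").save()
```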

examples/entity-aggregation/build.gradle

Lines changed: 2 additions & 2 deletions
@@ -7,8 +7,8 @@ repositories {
 }

 dependencies {
-    implementation 'org.apache.spark:spark-sql_2.12:3.3.2'
-    implementation "com.marklogic:marklogic-spark-connector:2.0.0"
+    implementation 'org.apache.spark:spark-sql_2.12:3.4.1'
+    implementation "com.marklogic:marklogic-spark-connector:2.1.0"
     implementation "org.postgresql:postgresql:42.6.0"
 }

examples/getting-started/build.gradle

Lines changed: 1 addition & 1 deletion
@@ -1,6 +1,6 @@
 plugins {
     id 'net.saliman.properties' version '1.5.2'
-    id "com.marklogic.ml-gradle" version "4.5.1"
+    id "com.marklogic.ml-gradle" version "4.6.0"
 }

 repositories {

examples/getting-started/gradle/wrapper/gradle-wrapper.properties

Lines changed: 1 addition & 1 deletion

@@ -1,5 +1,5 @@
 distributionBase=GRADLE_USER_HOME
 distributionPath=wrapper/dists
-distributionUrl=https\://services.gradle.org/distributions/gradle-7.5.1-bin.zip
+distributionUrl=https\://services.gradle.org/distributions/gradle-8.4-bin.zip
 zipStoreBase=GRADLE_USER_HOME
 zipStorePath=wrapper/dists

examples/getting-started/marklogic-spark-getting-started.ipynb

Lines changed: 1 addition & 1 deletion
@@ -53,7 +53,7 @@
 "source": [
 "# Make the MarkLogic connector available to the underlying PySpark application.\n",
 "import os\n",
-"os.environ['PYSPARK_SUBMIT_ARGS'] = '--jars \"marklogic-spark-connector-2.0.0.jar\" pyspark-shell'\n",
+"os.environ['PYSPARK_SUBMIT_ARGS'] = '--jars \"marklogic-spark-connector-2.1.0.jar\" pyspark-shell'\n",
 "\n",
 "# Define the connection details for the getting-started example application.\n",
 "client_uri = \"spark-example-user:password@localhost:8003\"\n",

examples/java-dependency/build.gradle

Lines changed: 1 addition & 2 deletions
@@ -3,13 +3,12 @@ plugins {
 }

 repositories {
-    mavenLocal()
     mavenCentral()
 }

 dependencies {
     implementation 'org.apache.spark:spark-sql_2.12:3.4.1'
-    implementation 'com.marklogic:marklogic-spark-connector:2.1-SNAPSHOT'
+    implementation 'com.marklogic:marklogic-spark-connector:2.1.0'
 }

 task runApp(type: JavaExec) {
