diff --git a/.github/workflows/generate_docs.yml b/.github/workflows/generate_docs.yml
new file mode 100644
index 00000000..9ca5d938
--- /dev/null
+++ b/.github/workflows/generate_docs.yml
@@ -0,0 +1,25 @@
+name: Generate and publish docs
+
+on:
+  push:
+    branches:
+      - "spark-3.2"
+  pull_request:
+    branches:
+      - "spark-3.2"
+
+jobs:
+  generate-and-publish-docs:
+    runs-on: ubuntu-latest
+
+    steps:
+      - uses: actions/checkout@v2
+      - name: Set up JDK 11
+        uses: actions/setup-java@v2
+        with:
+          distribution: adopt
+          java-version: 11
+          check-latest: true
+      - name: Generate docs
+        run: ./mvnw clean package site -Dmaven.test.skip=true
+      # TODO create branch and copy the docs over from kotlin-spark-api/3.2/target/dokka
\ No newline at end of file
diff --git a/README.md b/README.md
index f090f0cf..79c669e4 100644
--- a/README.md
+++ b/README.md
@@ -1,4 +1,4 @@
-# Kotlin for Apache® Spark™ [![Maven Central](https://img.shields.io/maven-central/v/org.jetbrains.kotlinx.spark/kotlin-spark-api-parent.svg?label=Maven%20Central)](https://search.maven.org/search?q=g:org.jetbrains.kotlinx.spark%20AND%20v:1.0.2) [![official JetBrains project](http://jb.gg/badges/incubator.svg)](https://confluence.jetbrains.com/display/ALL/JetBrains+on+GitHub)
+# Kotlin for Apache® Spark™ [![Maven Central](https://img.shields.io/maven-central/v/org.jetbrains.kotlinx.spark/kotlin-spark-api-parent.svg?label=Maven%20Central)](https://search.maven.org/search?q=g:org.jetbrains.kotlinx.spark%20AND%20v:1.0.2) [![official JetBrains project](http://jb.gg/badges/official.svg)](https://confluence.jetbrains.com/display/ALL/JetBrains+on+GitHub)
 
 Your next API to work with [Apache Spark](https://spark.apache.org/).
 
diff --git a/kotlin-spark-api/3.2/pom_2.12.xml b/kotlin-spark-api/3.2/pom_2.12.xml
index 7195f912..756d9c2b 100644
--- a/kotlin-spark-api/3.2/pom_2.12.xml
+++ b/kotlin-spark-api/3.2/pom_2.12.xml
@@ -27,10 +27,7 @@
         <dependency>
             <groupId>org.jetbrains.kotlinx.spark</groupId>
             <artifactId>core-3.2_${scala.compat.version}</artifactId>
         </dependency>
-        <dependency>
-            <groupId>org.jetbrains.kotlinx.spark</groupId>
-            <artifactId>kotlin-spark-api-common</artifactId>
-        </dependency>
+
diff --git a/kotlin-spark-api/3.2/src/main/kotlin/org/jetbrains/kotlinx/spark/api/ApiV1.kt b/kotlin-spark-api/3.2/src/main/kotlin/org/jetbrains/kotlinx/spark/api/ApiV1.kt
index 32935f40..e679f561 100644
--- a/kotlin-spark-api/3.2/src/main/kotlin/org/jetbrains/kotlinx/spark/api/ApiV1.kt
+++ b/kotlin-spark-api/3.2/src/main/kotlin/org/jetbrains/kotlinx/spark/api/ApiV1.kt
@@ -21,6 +21,7 @@
 
 package org.jetbrains.kotlinx.spark.api
 
+import org.apache.hadoop.shaded.org.apache.commons.math3.exception.util.ArgUtils
 import org.apache.spark.SparkContext
 import org.apache.spark.api.java.JavaSparkContext
 import org.apache.spark.api.java.function.*
@@ -36,6 +37,7 @@ import org.jetbrains.kotlinx.spark.extensions.KSparkExtensions
 import scala.Product
 import scala.Tuple2
 import scala.reflect.ClassTag
+import scala.reflect.api.TypeTags.TypeTag
 import java.beans.PropertyDescriptor
 import java.math.BigDecimal
 import java.sql.Date
@@ -82,7 +84,7 @@ import kotlin.reflect.full.primaryConstructor
 import kotlin.to
 
 @JvmField
-val ENCODERS = mapOf<KClass<*>, Encoder<*>>(
+val ENCODERS: Map<KClass<*>, Encoder<*>> = mapOf(
     Boolean::class to BOOLEAN(),
     Byte::class to BYTE(),
     Short::class to SHORT(),
@@ -164,6 +166,9 @@ inline fun <reified T> List<T>.toDS(spark: SparkSession): Dataset<T> =
 @OptIn(ExperimentalStdlibApi::class)
 inline fun <reified T> encoder(): Encoder<T> = generateEncoder(typeOf<T>(), T::class)
 
+/**
+ * @see encoder
+ */
 fun <T> generateEncoder(type: KType, cls: KClass<*>): Encoder<T> {
     @Suppress("UNCHECKED_CAST")
     return when {
@@ -172,7 +177,8 @@ fun <T> generateEncoder(type:
KType, cls: KClass<*>): Encoder { } as Encoder } -private fun isSupportedClass(cls: KClass<*>): Boolean = cls.isData +private fun isSupportedClass(cls: KClass<*>): Boolean = + cls.isData || cls.isSubclassOf(Map::class) || cls.isSubclassOf(Iterable::class) || cls.isSubclassOf(Product::class) @@ -192,30 +198,89 @@ private fun kotlinClassEncoder(schema: DataType, kClass: KClass<*>): Encoder ) } +/** + * (Kotlin-specific) + * Returns a new Dataset that contains the result of applying [func] to each element. + */ inline fun Dataset.map(noinline func: (T) -> R): Dataset = map(MapFunction(func), encoder()) +/** + * (Kotlin-specific) + * Returns a new Dataset by first applying a function to all elements of this Dataset, + * and then flattening the results. + */ inline fun Dataset.flatMap(noinline func: (T) -> Iterator): Dataset = flatMap(func, encoder()) +/** + * (Kotlin-specific) + * Returns a new Dataset by flattening. This means that a Dataset of an iterable such as + * `listOf(listOf(1, 2, 3), listOf(4, 5, 6))` will be flattened to a Dataset of `listOf(1, 2, 3, 4, 5, 6)`. + */ inline fun > Dataset.flatten(): Dataset = flatMap(FlatMapFunction { it.iterator() }, encoder()) +/** + * (Kotlin-specific) + * Returns a [KeyValueGroupedDataset] where the data is grouped by the given key [func]. + */ inline fun Dataset.groupByKey(noinline func: (T) -> R): KeyValueGroupedDataset = groupByKey(MapFunction(func), encoder()) +/** + * (Kotlin-specific) + * Returns a new Dataset that contains the result of applying [func] to each partition. + */ inline fun Dataset.mapPartitions(noinline func: (Iterator) -> Iterator): Dataset = mapPartitions(func, encoder()) +/** + * (Kotlin-specific) + * Filters rows to eliminate [null] values. + */ @Suppress("UNCHECKED_CAST") fun Dataset.filterNotNull(): Dataset = filter { it != null } as Dataset +/** + * Returns a new [KeyValueGroupedDataset] where the given function [func] has been applied + * to the data. The grouping key is unchanged by this. + * + * ```kotlin + * // Create values grouped by key from a Dataset> + * ds.groupByKey { it._1 }.mapValues { it._2 } + * ``` + */ inline fun KeyValueGroupedDataset.mapValues(noinline func: (VALUE) -> R): KeyValueGroupedDataset = mapValues(MapFunction(func), encoder()) +/** + * (Kotlin-specific) + * Applies the given function to each group of data. For each unique group, the function will + * be passed the group key and an iterator that contains all the elements in the group. The + * function can return an element of arbitrary type which will be returned as a new [Dataset]. + * + * This function does not support partial aggregation, and as a result requires shuffling all + * the data in the [Dataset]. If an application intends to perform an aggregation over each + * key, it is best to use the reduce function or an + * [org.apache.spark.sql.expressions.Aggregator]. + * + * Internally, the implementation will spill to disk if any given group is too large to fit into + * memory. However, users must take care to avoid materializing the whole iterator for a group + * (for example, by calling [toList]) unless they are sure that this is possible given the memory + * constraints of their cluster. + */ inline fun KeyValueGroupedDataset.mapGroups(noinline func: (KEY, Iterator) -> R): Dataset = mapGroups(MapGroupsFunction(func), encoder()) +/** + * (Kotlin-specific) + * Reduces the elements of each group of data using the specified binary function. 
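// A minimal usage sketch of the typed Dataset extensions documented above (map, groupByKey,
// mapValues, mapGroups). The data class Person and the sample rows are hypothetical and not part
// of this change; only the extension functions themselves come from the API in this diff.

import org.jetbrains.kotlinx.spark.api.*

data class Person(val name: String, val age: Int)

fun main() = withSpark {
    val people = dsOf(Person("Alice", 30), Person("Bob", 25), Person("Cecil", 30))

    // Typed transformation: the result encoder is picked up via the reified type parameter.
    val greetings = people.map { "${it.name} (${it.age})" } // Dataset<String>

    // Grouping stays typed as well: KeyValueGroupedDataset<Int, Person> -> Dataset<Pair<Int, String>>.
    val namesByAge = people
        .groupByKey { it.age }
        .mapValues { it.name }
        .mapGroups { age, names -> age to names.asSequence().joinToString() }

    greetings.show()
    namesByAge.show()
}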
+ * The given function must be commutative and associative or the result may be non-deterministic. + * + * Note that you need to use [reduceGroupsK] always instead of the Java- or Scala-specific + * [KeyValueGroupedDataset.reduceGroups] to make the compiler work. + */ inline fun KeyValueGroupedDataset.reduceGroupsK(noinline func: (VALUE, VALUE) -> VALUE): Dataset> = reduceGroups(ReduceFunction(func)) .map { t -> t._1 to t._2 } @@ -228,23 +293,63 @@ inline fun KeyValueGroupedDataset.reduc inline fun Dataset.reduceK(noinline func: (T, T) -> T): T = reduce(ReduceFunction(func)) +/** + * (Kotlin-specific) + * Maps the Dataset to only retain the "keys" or [Tuple2._1] values. + */ @JvmName("takeKeysTuple2") inline fun Dataset>.takeKeys(): Dataset = map { it._1() } +/** + * (Kotlin-specific) + * Maps the Dataset to only retain the "keys" or [Pair.first] values. + */ inline fun Dataset>.takeKeys(): Dataset = map { it.first } +/** + * (Kotlin-specific) + * Maps the Dataset to only retain the "keys" or [Arity2._1] values. + */ @JvmName("takeKeysArity2") inline fun Dataset>.takeKeys(): Dataset = map { it._1 } +/** + * (Kotlin-specific) + * Maps the Dataset to only retain the "values" or [Tuple2._2] values. + */ @JvmName("takeValuesTuple2") inline fun Dataset>.takeValues(): Dataset = map { it._2() } +/** + * (Kotlin-specific) + * Maps the Dataset to only retain the "values" or [Pair.second] values. + */ inline fun Dataset>.takeValues(): Dataset = map { it.second } +/** + * (Kotlin-specific) + * Maps the Dataset to only retain the "values" or [Arity2._2] values. + */ @JvmName("takeValuesArity2") inline fun Dataset>.takeValues(): Dataset = map { it._2 } - +/** + * (Kotlin-specific) + * Applies the given function to each group of data. For each unique group, the function will + * be passed the group key and an iterator that contains all the elements in the group. The + * function can return an iterator containing elements of an arbitrary type which will be returned + * as a new [Dataset]. + * + * This function does not support partial aggregation, and as a result requires shuffling all + * the data in the [Dataset]. If an application intends to perform an aggregation over each + * key, it is best to use the reduce function or an + * [org.apache.spark.sql.expressions.Aggregator]. + * + * Internally, the implementation will spill to disk if any given group is too large to fit into + * memory. However, users must take care to avoid materializing the whole iterator for a group + * (for example, by calling [toList]) unless they are sure that this is possible given the memory + * constraints of their cluster. + */ inline fun KeyValueGroupedDataset.flatMapGroups( noinline func: (key: K, values: Iterator) -> Iterator, ): Dataset = flatMapGroups( @@ -252,12 +357,57 @@ inline fun KeyValueGroupedDataset.flatMapGroups( encoder() ) +/** + * (Kotlin-specific) + * Returns the group state value if it exists, else [null]. + * This is comparable to [GroupState.getOption], but instead utilises Kotlin's nullability features + * to get the same result. + */ fun GroupState.getOrNull(): S? = if (exists()) get() else null +/** + * (Kotlin-specific) + * Allows the group state object to be used as a delegate. Will be [null] if it does not exist. + * + * For example: + * ```kotlin + * groupedDataset.mapGroupsWithState(GroupStateTimeout.NoTimeout()) { key, values, state: GroupState -> + * var s by state + * ... + * } + * ``` + */ operator fun GroupState.getValue(thisRef: Any?, property: KProperty<*>): S? 
= getOrNull() -operator fun GroupState.setValue(thisRef: Any?, property: KProperty<*>, value: S?): Unit = update(value) +/** + * (Kotlin-specific) + * Allows the group state object to be used as a delegate. Will be [null] if it does not exist. + * + * For example: + * ```kotlin + * groupedDataset.mapGroupsWithState(GroupStateTimeout.NoTimeout()) { key, values, state: GroupState -> + * var s by state + * ... + * } + * ``` + */ +operator fun GroupState.setValue(thisRef: Any?, property: KProperty<*>, value: S?): Unit = update(value) +/** + * (Kotlin-specific) + * Applies the given function to each group of data, while maintaining a user-defined per-group + * state. The result Dataset will represent the objects returned by the function. + * For a static batch Dataset, the function will be invoked once per group. For a streaming + * Dataset, the function will be invoked for each group repeatedly in every trigger, and + * updates to each group's state will be saved across invocations. + * See [org.apache.spark.sql.streaming.GroupState] for more details. + * + * @param S The type of the user-defined state. Must be encodable to Spark SQL types. + * @param U The type of the output objects. Must be encodable to Spark SQL types. + * @param func Function to be called on every group. + * + * See [Encoder] for more details on what types are encodable to Spark SQL. + */ inline fun KeyValueGroupedDataset.mapGroupsWithState( noinline func: (key: K, values: Iterator, state: GroupState) -> U, ): Dataset = mapGroupsWithState( @@ -266,6 +416,22 @@ inline fun KeyValueGroupedDataset.mapGroupsWi encoder() ) +/** + * (Kotlin-specific) + * Applies the given function to each group of data, while maintaining a user-defined per-group + * state. The result Dataset will represent the objects returned by the function. + * For a static batch Dataset, the function will be invoked once per group. For a streaming + * Dataset, the function will be invoked for each group repeatedly in every trigger, and + * updates to each group's state will be saved across invocations. + * See [org.apache.spark.sql.streaming.GroupState] for more details. + * + * @param S The type of the user-defined state. Must be encodable to Spark SQL types. + * @param U The type of the output objects. Must be encodable to Spark SQL types. + * @param func Function to be called on every group. + * @param timeoutConf Timeout configuration for groups that do not receive data for a while. + * + * See [Encoder] for more details on what types are encodable to Spark SQL. + */ inline fun KeyValueGroupedDataset.mapGroupsWithState( timeoutConf: GroupStateTimeout, noinline func: (key: K, values: Iterator, state: GroupState) -> U, @@ -276,6 +442,23 @@ inline fun KeyValueGroupedDataset.mapGroupsWi timeoutConf ) +/** + * (Kotlin-specific) + * Applies the given function to each group of data, while maintaining a user-defined per-group + * state. The result Dataset will represent the objects returned by the function. + * For a static batch Dataset, the function will be invoked once per group. For a streaming + * Dataset, the function will be invoked for each group repeatedly in every trigger, and + * updates to each group's state will be saved across invocations. + * See [GroupState] for more details. + * + * @param S The type of the user-defined state. Must be encodable to Spark SQL types. + * @param U The type of the output objects. Must be encodable to Spark SQL types. + * @param func Function to be called on every group. 
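// A minimal sketch of the GroupState delegate and mapGroupsWithState documented above.
// The String grouping key, the Int state type and the running-count logic are hypothetical;
// only getOrNull, the getValue/setValue delegates and mapGroupsWithState come from this diff.

import org.apache.spark.sql.streaming.GroupState
import org.apache.spark.sql.streaming.GroupStateTimeout
import org.jetbrains.kotlinx.spark.api.*

fun main() = withSpark {
    val grouped = dsOf("apple", "avocado", "banana").groupByKey { it.first().toString() }

    // Keep a running count per key in GroupState<Int>, read and written through the delegate.
    val counts = grouped.mapGroupsWithState(GroupStateTimeout.NoTimeout()) { key, values, state: GroupState<Int> ->
        var count by state                          // null while no state has been stored yet
        val newCount = (count ?: 0) + values.asSequence().count()
        count = newCount                            // delegates to state.update(newCount)
        key to newCount
    }

    counts.show()
}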
+ * @param outputMode The output mode of the function. + * @param timeoutConf Timeout configuration for groups that do not receive data for a while. + * + * See [Encoder] for more details on what types are encodable to Spark SQL. + */ inline fun KeyValueGroupedDataset.flatMapGroupsWithState( outputMode: OutputMode, timeoutConf: GroupStateTimeout, @@ -288,6 +471,13 @@ inline fun KeyValueGroupedDataset.flatMapGrou timeoutConf ) +/** + * (Kotlin-specific) + * Applies the given function to each cogrouped data. For each unique group, the function will + * be passed the grouping key and 2 iterators containing all elements in the group from + * [Dataset] [this] and [other]. The function can return an iterator containing elements of an + * arbitrary type which will be returned as a new [Dataset]. + */ inline fun KeyValueGroupedDataset.cogroup( other: KeyValueGroupedDataset, noinline func: (key: K, left: Iterator, right: Iterator) -> Iterator, @@ -297,30 +487,93 @@ inline fun KeyValueGroupedDataset.cogroup( encoder() ) +/** DEPRECATED: Use [as] or [to] for this. */ +@Deprecated( + message = "Deprecated, since we already have `as`() and to().", + replaceWith = ReplaceWith("this.to()"), + level = DeprecationLevel.ERROR, +) inline fun Dataset.downcast(): Dataset = `as`(encoder()) + +/** + * (Kotlin-specific) + * Returns a new Dataset where each record has been mapped on to the specified type. The + * method used to map columns depend on the type of [R]: + * - When [R] is a class, fields for the class will be mapped to columns of the same name + * (case sensitivity is determined by [spark.sql.caseSensitive]). + * - When [R] is a tuple, the columns will be mapped by ordinal (i.e. the first column will + * be assigned to `_1`). + * - When [R] is a primitive type (i.e. [String], [Int], etc.), then the first column of the + * `DataFrame` will be used. + * + * If the schema of the Dataset does not match the desired [R] type, you can use [Dataset.select]/[selectTyped] + * along with [Dataset.alias] or [as]/[to] to rearrange or rename as required. + * + * Note that [as]/[to] only changes the view of the data that is passed into typed operations, + * such as [map], and does not eagerly project away any columns that are not present in + * the specified class. + * + * @see to as alias for [as] + */ inline fun Dataset<*>.`as`(): Dataset = `as`(encoder()) + +/** + * (Kotlin-specific) + * Returns a new Dataset where each record has been mapped on to the specified type. The + * method used to map columns depend on the type of [R]: + * - When [R] is a class, fields for the class will be mapped to columns of the same name + * (case sensitivity is determined by [spark.sql.caseSensitive]). + * - When [R] is a tuple, the columns will be mapped by ordinal (i.e. the first column will + * be assigned to `_1`). + * - When [R] is a primitive type (i.e. [String], [Int], etc.), then the first column of the + * `DataFrame` will be used. + * + * If the schema of the Dataset does not match the desired [R] type, you can use [Dataset.select]/[selectTyped] + * along with [Dataset.alias] or [as]/[to] to rearrange or rename as required. + * + * Note that [as]/[to] only changes the view of the data that is passed into typed operations, + * such as [map], and does not eagerly project away any columns that are not present in + * the specified class. 
+ * + * @see as as alias for [to] + */ inline fun Dataset<*>.to(): Dataset = `as`(encoder()) -inline fun Dataset.forEach(noinline func: (T) -> Unit) = foreach(ForeachFunction(func)) +/** + * (Kotlin-specific) + * Applies a function [func] to all rows. + */ +inline fun Dataset.forEach(noinline func: (T) -> Unit): Unit = foreach(ForeachFunction(func)) -inline fun Dataset.forEachPartition(noinline func: (Iterator) -> Unit) = +/** + * (Kotlin-specific) + * Runs [func] on each partition of this Dataset. + */ +inline fun Dataset.forEachPartition(noinline func: (Iterator) -> Unit): Unit = foreachPartition(ForeachPartitionFunction(func)) /** * It's hard to call `Dataset.debugCodegen` from kotlin, so here is utility for that */ -fun Dataset.debugCodegen() = also { KSparkExtensions.debugCodegen(it) } +fun Dataset.debugCodegen(): Dataset = also { KSparkExtensions.debugCodegen(it) } -val SparkSession.sparkContext +/** + * Returns the Spark context associated with this Spark session. + */ +val SparkSession.sparkContext: SparkContext get() = KSparkExtensions.sparkContext(this) /** * It's hard to call `Dataset.debug` from kotlin, so here is utility for that */ -fun Dataset.debug() = also { KSparkExtensions.debug(it) } +fun Dataset.debug(): Dataset = also { KSparkExtensions.debug(it) } @Suppress("FunctionName") -@Deprecated("Changed to \"`===`\" to better reflect Scala API.", ReplaceWith("this `===` c")) +@Deprecated( + message = "Changed to \"`===`\" to better reflect Scala API.", + replaceWith = ReplaceWith("this `===` c"), + level = DeprecationLevel.ERROR, +) infix fun Column.`==`(c: Column) = `$eq$eq$eq`(c) /** @@ -648,7 +901,17 @@ operator fun Column.rem(other: Any): Column = `$percent`(other) */ operator fun Column.get(key: Any): Column = getItem(key) -fun lit(a: Any) = functions.lit(a) +/** + * Creates a [Column] of literal value. + * + * The passed in object is returned directly if it is already a [Column]. + * If the object is a Scala Symbol, it is converted into a [Column] also. + * Otherwise, a new [Column] is created to represent the literal value. + * + * This is just a shortcut to the function from [org.apache.spark.sql.functions]. + * For all the functions, simply add `import org.apache.spark.sql.functions.*` to your file. + */ +fun lit(a: Any): Column = functions.lit(a) /** * Provides a type hint about the expected return value of this column. This information can @@ -755,8 +1018,15 @@ inline fun Dataset.withCached( return cached.executeOnCached().also { cached.unpersist(blockingUnpersist) } } -inline fun Dataset.toList() = KSparkExtensions.collectAsList(to()) -inline fun Dataset<*>.toArray(): Array = to().collect() as Array +/** + * Collects the dataset as list where each item has been mapped to type [T]. + */ +inline fun Dataset<*>.toList(): List = to().collectAsList() as List + +/** + * Collects the dataset as Array where each item has been mapped to type [T]. + */ +inline fun Dataset<*>.toArray(): Array = to().collect() as Array /** * Selects column based on the column name and returns it as a [Column]. 
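// A minimal sketch of the `as`/`to` view change and the reified toList collector documented above.
// The data classes Sale and SaleAmount are hypothetical; only `to`, `toList` and `dsOf` come from
// the API in this diff.

import org.jetbrains.kotlinx.spark.api.*

data class Sale(val id: Int, val amount: Double, val comment: String)
data class SaleAmount(val id: Int, val amount: Double)

fun main() = withSpark {
    val sales = dsOf(Sale(1, 10.0, "a"), Sale(2, 20.5, "b"))

    // `to<SaleAmount>()` only changes the typed view; it does not eagerly drop the `comment` column.
    val amounts = sales.to<SaleAmount>()

    // Collect to the driver as a plain Kotlin List<SaleAmount>.
    val collected = amounts.toList<SaleAmount>()
    println(collected)
}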
@@ -773,7 +1043,6 @@ operator fun Dataset.invoke(colName: String): Column = col(colName) * ``` * @see invoke */ - @Suppress("UNCHECKED_CAST") inline fun Dataset.col(column: KProperty1): TypedColumn = col(column.name).`as`() as TypedColumn @@ -888,6 +1157,14 @@ inline fun = mapOf()): DataType { val primitiveSchema = knownDataTypes[type.classifier] @@ -987,15 +1264,24 @@ fun schema(type: KType, map: Map = mapOf()): DataType { } } +/** + * The entry point to programming Spark with the Dataset and DataFrame API. + * + * @see org.apache.spark.sql.SparkSession + */ typealias SparkSession = org.apache.spark.sql.SparkSession -fun SparkContext.setLogLevel(level: SparkLogLevel) = setLogLevel(level.name) +/** + * Control our logLevel. This overrides any user-defined log settings. + * @param level The desired log level as [SparkLogLevel]. + */ +fun SparkContext.setLogLevel(level: SparkLogLevel): Unit = setLogLevel(level.name) enum class SparkLogLevel { ALL, DEBUG, ERROR, FATAL, INFO, OFF, TRACE, WARN } -private val knownDataTypes = mapOf( +private val knownDataTypes: Map, DataType> = mapOf( Byte::class to DataTypes.ByteType, Short::class to DataTypes.ShortType, Int::class to DataTypes.IntegerType, @@ -1007,7 +1293,7 @@ private val knownDataTypes = mapOf( LocalDate::class to `DateType$`.`MODULE$`, Date::class to `DateType$`.`MODULE$`, Timestamp::class to `TimestampType$`.`MODULE$`, - Instant::class to `TimestampType$`.`MODULE$` + Instant::class to `TimestampType$`.`MODULE$`, ) private fun transitiveMerge(a: Map, b: Map): Map { @@ -1017,11 +1303,12 @@ private fun transitiveMerge(a: Map, b: Map): Map(val f: (T) -> R) : (T) -> R { + private val values = ConcurrentHashMap() - override fun invoke(x: T) = - values.getOrPut(x, { f(x) }) + + override fun invoke(x: T): R = values.getOrPut(x) { f(x) } } private fun ((T) -> R).memoize(): (T) -> R = Memoize1(this) -private val memoizedSchema = { x: KType -> schema(x) }.memoize() +private val memoizedSchema: (KType) -> DataType = { x: KType -> schema(x) }.memoize() diff --git a/kotlin-spark-api/common/src/main/kotlin/org/jetbrains/kotlinx/spark/api/Iterators.kt b/kotlin-spark-api/3.2/src/main/kotlin/org/jetbrains/kotlinx/spark/api/Iterators.kt similarity index 91% rename from kotlin-spark-api/common/src/main/kotlin/org/jetbrains/kotlinx/spark/api/Iterators.kt rename to kotlin-spark-api/3.2/src/main/kotlin/org/jetbrains/kotlinx/spark/api/Iterators.kt index b93ce377..9f7de351 100644 --- a/kotlin-spark-api/common/src/main/kotlin/org/jetbrains/kotlinx/spark/api/Iterators.kt +++ b/kotlin-spark-api/3.2/src/main/kotlin/org/jetbrains/kotlinx/spark/api/Iterators.kt @@ -57,9 +57,13 @@ class FilteringIterator( done() } } + +/** Maps the values of the iterator lazily using [func]. */ fun Iterator.map(func: (T) -> R): Iterator = MappingIterator(this, func) +/** Filters the values of the iterator lazily using [func]. */ fun Iterator.filter(func: (T) -> Boolean): Iterator = FilteringIterator(this, func) +/** Partitions the values of the iterator lazily in groups of [size]. 
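// A minimal sketch of the lazy Iterator helpers from Iterators.kt above (map, filter, partition);
// plain Kotlin, no Spark session involved. The sample numbers are arbitrary.

import org.jetbrains.kotlinx.spark.api.*

fun main() {
    val chunks = (1..6).iterator()
        .map { it * 2 }           // 2, 4, 6, 8, 10, 12 — evaluated lazily
        .filter { it % 3 == 0 }   // 6, 12
        .partition(2)             // groups of at most 2 elements

    chunks.forEach { println(it) } // prints [6, 12]
}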
*/ fun Iterator.partition(size: Int): Iterator> = PartitioningIterator(this, size) diff --git a/kotlin-spark-api/3.2/src/main/kotlin/org/jetbrains/kotlinx/spark/api/SparkHelper.kt b/kotlin-spark-api/3.2/src/main/kotlin/org/jetbrains/kotlinx/spark/api/SparkHelper.kt index 3ef0b177..6188daae 100644 --- a/kotlin-spark-api/3.2/src/main/kotlin/org/jetbrains/kotlinx/spark/api/SparkHelper.kt +++ b/kotlin-spark-api/3.2/src/main/kotlin/org/jetbrains/kotlinx/spark/api/SparkHelper.kt @@ -19,22 +19,27 @@ */ package org.jetbrains.kotlinx.spark.api +import org.apache.spark.SparkConf import org.apache.spark.sql.SparkSession.Builder import org.apache.spark.sql.UDFRegistration import org.jetbrains.kotlinx.spark.api.SparkLogLevel.ERROR /** - * Wrapper for spark creation which allows to set different spark params + * Wrapper for spark creation which allows setting different spark params. * * @param props spark options, value types are runtime-checked for type-correctness - * @param master [SparkSession.Builder.master] - * @param appName [SparkSession.Builder.appName] + * @param master Sets the Spark master URL to connect to, such as "local" to run locally, "local[4]" to + * run locally with 4 cores, or "spark://master:7077" to run on a Spark standalone cluster. By default, it + * tries to get the system value "spark.master", otherwise it uses "local[*]" + * @param appName Sets a name for the application, which will be shown in the Spark web UI. + * If no application name is set, a randomly generated name will be used. + * @param logLevel Control our logLevel. This overrides any user-defined log settings. * @param func function which will be executed in context of [KSparkSession] (it means that `this` inside block will point to [KSparkSession]) */ @JvmOverloads inline fun withSpark( props: Map = emptyMap(), - master: String = "local[*]", + master: String = SparkConf().get("spark.master", "local[*]"), appName: String = "Kotlin Spark Sample", logLevel: SparkLogLevel = ERROR, func: KSparkSession.() -> Unit, @@ -58,10 +63,17 @@ inline fun withSpark( } +/** + * Wrapper for spark creation which allows setting different spark params. + * + * @param builder A [SparkSession.Builder] object, configured how you want. + * @param logLevel Control our logLevel. This overrides any user-defined log settings. + * @param func function which will be executed in context of [KSparkSession] (it means that `this` inside block will point to [KSparkSession]) + */ @JvmOverloads inline fun withSpark(builder: Builder, logLevel: SparkLogLevel = ERROR, func: KSparkSession.() -> Unit) { builder - .orCreate + .getOrCreate() .apply { KSparkSession(this).apply { sparkContext.setLogLevel(logLevel) diff --git a/kotlin-spark-api/common/src/main/kotlin/org/jetbrains/kotlinx/spark/api/VarArities.kt b/kotlin-spark-api/3.2/src/main/kotlin/org/jetbrains/kotlinx/spark/api/VarArities.kt similarity index 100% rename from kotlin-spark-api/common/src/main/kotlin/org/jetbrains/kotlinx/spark/api/VarArities.kt rename to kotlin-spark-api/3.2/src/main/kotlin/org/jetbrains/kotlinx/spark/api/VarArities.kt diff --git a/kotlin-spark-api/common/pom.xml b/kotlin-spark-api/common/pom.xml deleted file mode 100644 index 19959fdb..00000000 --- a/kotlin-spark-api/common/pom.xml +++ /dev/null @@ -1,56 +0,0 @@ - - - 4.0.0 - - Kotlin Spark API: Common - kotlin-spark-api-common - Kotlin API for Apache Spark: common parts - - org.jetbrains.kotlinx.spark - kotlin-spark-api-parent - 1.0.4-SNAPSHOT - ../.. 
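// A minimal sketch of the two withSpark overloads documented above. The appName/master values and
// the tiny job bodies are illustrative; per this diff, the default master now falls back to
// SparkConf's "spark.master" before "local[*]", and the Builder overload uses getOrCreate().

import org.jetbrains.kotlinx.spark.api.*

fun main() {
    // Parameter-based overload: props, master, appName and logLevel all have defaults.
    withSpark(appName = "docs-example", master = "local[2]", logLevel = SparkLogLevel.WARN) {
        dsOf(1, 2, 3).map { it * it }.show()
    }

    // Builder-based overload: hand over a pre-configured SparkSession.Builder instead.
    withSpark(builder = SparkSession.builder().appName("docs-example").master("local[2]")) {
        dsOf("a", "b", "c").forEach { println(it) }
    }
}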
- - - - - org.jetbrains.kotlin - kotlin-stdlib-jdk8 - - - - - src/main/kotlin - src/test/kotlin - - - org.jetbrains.kotlin - kotlin-maven-plugin - - - org.jetbrains.dokka - dokka-maven-plugin - ${dokka.version} - - 8 - - - - dokka - - dokka - - pre-site - - - javadocjar - - javadocJar - - pre-integration-test - - - - - - diff --git a/pom.xml b/pom.xml index 4f0974c5..47043737 100644 --- a/pom.xml +++ b/pom.xml @@ -11,7 +11,7 @@ 1.5.30 - 1.4.32 + 1.6.10 0.16.0 4.6.0 1.0.1 @@ -35,7 +35,6 @@ - kotlin-spark-api/common dummy @@ -51,11 +50,6 @@ kotlin-reflect ${kotlin.version} - - org.jetbrains.kotlinx.spark - kotlin-spark-api-common - ${project.version} -