garage-education
diff --git a/‎Code/20-spark-operations/20-spark-operations.ipynb
+18-10 b/‎Code/20-spark-operations/20-spark-operations.ipynb
+18-10
diff --git a/‎Code/20-spark-operations/20-spark-operations.md
+137 b/‎Code/20-spark-operations/20-spark-operations.md
+137
diff --git a/‎Code/22-spark-immutability/22-spark-immutablility-example.ipynb
+18-11 b/‎Code/22-spark-immutability/22-spark-immutablility-example.ipynb
+18-11
@@ -32,11 +32,13 @@
    },
    "outputs": [
     {
-     "output_type": "stream",
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Original RDD ID: 227\nOriginal RDD ID: 227\nTransformed RDD ID: 228\nTransformed RDD result: [2, 4, 6, 8, 10]\n"
+      "Original RDD ID: 227\n",
+      "Original RDD ID: 227\n",
+      "Transformed RDD ID: 228\n",
+      "Transformed RDD result: [2, 4, 6, 8, 10]\n"
      ]
     }
    ],
@@ -73,7 +75,6 @@
    },
    "outputs": [
     {
-     "output_type": "display_data",
      "data": {
       "text/html": [
        "<style scoped>\n",
@@ -142,7 +143,6 @@
    },
    "outputs": [
     {
-     "output_type": "display_data",
      "data": {
       "text/html": [
        "<style scoped>\n",
@@ -228,11 +228,14 @@
    },
    "outputs": [
     {
-     "output_type": "stream",
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Original RDD:\n('John', 28)\n('Smith', 44)\n('Adam', 65)\n('Henry', 23)\n"
+      "Original RDD:\n",
+      "('John', 28)\n",
+      "('Smith', 44)\n",
+      "('Adam', 65)\n",
+      "('Henry', 23)\n"
      ]
     }
    ],
@@ -264,11 +267,15 @@
    },
    "outputs": [
     {
-     "output_type": "stream",
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Original RDD ID: 316\nOriginal RDD ID After filter: 317\nTransformed RDD ID: 318\nFiltered RDD:\n('Smith', 44)\n('Adam', 65)\n"
+      "Original RDD ID: 316\n",
+      "Original RDD ID After filter: 317\n",
+      "Transformed RDD ID: 318\n",
+      "Filtered RDD:\n",
+      "('Smith', 44)\n",
+      "('Adam', 65)\n"
      ]
     }
    ],
@@ -307,7 +314,6 @@
    },
    "outputs": [
     {
-     "output_type": "display_data",
      "data": {
       "text/html": [
        "<style scoped>\n",
@@ -406,7 +412,6 @@
    },
    "outputs": [
     {
-     "output_type": "display_data",
      "data": {
       "text/html": [
        "<style scoped>\n",
@@ -518,6 +523,9 @@
    },
    "notebookName": "20-spark-operations",
    "widgets": {}
+  },
+  "jupytext": {
+   "formats": "ipynb,md"
   }
  },
  "nbformat": 4,
 
@@ -0,0 +1,137 @@
+---
+jupyter:
+  jupytext:
+    formats: ipynb,md
+    main_language: python
+    text_representation:
+      extension: .md
+      format_name: markdown
+      format_version: '1.3'
+      jupytext_version: 1.16.2
+---
+
+# Immutable RDDs
+
+```python
+# Test Immutable RDDs
+numbers = [1, 2, 3, 4, 5]
+numbers_rdd = sc.parallelize(numbers)
+print(f"Original RDD ID: {numbers_rdd.id()}")
+print(f"Original RDD ID: {numbers_rdd.id()}")
+
+# Apply a transformation: multiply each number by 2
+transformed_rdd = numbers_rdd.map(lambda x: x * 2)
+print(f"Transformed RDD ID: {transformed_rdd.id()}")
+
+# Collect the results to trigger the computation
+result = transformed_rdd.collect()
+print(f"Transformed RDD result: {result}")
+
+```
+
+```python
+%scala
+// Test Immutable RDDs
+val numbers = List(1, 2, 3, 4, 5)
+val numbersRdd = sc.parallelize(numbers)
+println(s"Original RDD ID: ${numbersRdd.id}")
+println(s"Original RDD ID: ${numbersRdd.id}")
+println(s"Original RDD ID: ${numbersRdd.id}")
+
+
+```
+
+```python
+%scala
+
+// numbersRdd = numbersRdd.map(x => x * 2) // Oops! Does not compile: numbersRdd is a val and cannot be reassigned
+
+// Apply a transformation: multiply each number by 2
+val transformedRdd = numbersRdd.map(x => x * 2)
+println(s"Transformed RDD ID: ${transformedRdd.id}")
+
+// Collect the results to trigger the computation
+val result = transformedRdd.collect()
+println(s"Transformed RDD result: ${result.mkString(", ")}")
+```
+
+# Immutable RDD Example: Filter
+
+```python
+# Create an RDD
+data = [("John", 28), ("Smith", 44), ("Adam", 65), ("Henry", 23)]
+rdd = sc.parallelize(data)
+
+# Show the original RDD
+print("Original RDD:")
+for row in rdd.collect():
+    print(row)
+
+```
+
+```python
+
+print(f"Original RDD ID: {rdd.id()}")
+
+rdd = rdd.filter(lambda x: x[1] > 30)
+
+print(f"Original RDD ID After filter: {rdd.id()}")
+
+# Filter rows where the age is greater than 30
+filtered_rdd = rdd.filter(lambda x: x[1] > 30)
+print(f"Transformed RDD ID: {filtered_rdd.id()}")
+
+# Show the transformed RDD
+print("Filtered RDD:")
+for row in filtered_rdd.collect():
+    print(row)
+```
+
+```python
+%scala
+    // Create an RDD
+    val data = Seq(("John", 28), ("Smith", 44), ("Adam", 65), ("Henry", 23))
+    val rdd = sc.parallelize(data)
+
+    // Show the original RDD
+    println("Original RDD:")
+    rdd.collect().foreach(println)
+    // rdd = rdd.filter{ case (name, age) => age > 30 } // would not compile: rdd is a val and cannot be reassigned
+    // Filter rows where the age is greater than 30
+    val filteredRdd = rdd.filter{ case (name, age) => age > 30 }
+    println(s"Transformed RDD ID: ${filteredRdd.id}")
+
+    // Show the transformed RDD
+    println("Filtered RDD:")
+    filteredRdd.collect().foreach(println)
+```
+
+# Spark Lazy Evaluation
+
+```python
+# Create an RDD
+rdd = sc.parallelize([
+    ("John", 28),
+    ("Smith", 44),
+    ("Adam", 65),
+    ("Henry", 23)
+])
+
+# Apply a map transformation to create a new RDD of (name, age, flag) tuples,
+# where the boolean flag is True if the person is older than 30
+mapped_rdd = rdd.map(lambda x: (x[0], x[1], x[1] > 30))
+
+# Filter the RDD to include only people older than 30
+filtered_rdd = mapped_rdd.filter(lambda x: x[2])
+
+# Convert the filtered RDD to a DataFrame
+df = spark.createDataFrame(filtered_rdd, ["Name", "Age", "OlderThan30"])
+
+# Select only the name and age columns
+final_df = df.select("Name", "Age")
+
+# Collect the results; this action triggers the execution of all the lazy transformations above
+results = final_df.collect()
+display(results)
+
+```
@@ -32,11 +32,13 @@
    },
    "outputs": [
     {
-     "output_type": "stream",
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Original RDD ID: 227\nOriginal RDD ID: 227\nTransformed RDD ID: 228\nTransformed RDD result: [2, 4, 6, 8, 10]\n"
+      "Original RDD ID: 227\n",
+      "Original RDD ID: 227\n",
+      "Transformed RDD ID: 228\n",
+      "Transformed RDD result: [2, 4, 6, 8, 10]\n"
      ]
     }
    ],
@@ -73,7 +75,6 @@
    },
    "outputs": [
     {
-     "output_type": "display_data",
      "data": {
       "text/html": [
        "<style scoped>\n",
@@ -142,7 +143,6 @@
    },
    "outputs": [
     {
-     "output_type": "display_data",
      "data": {
       "text/html": [
        "<style scoped>\n",
@@ -213,7 +213,6 @@
    },
    "outputs": [
     {
-     "output_type": "display_data",
      "data": {
       "text/html": [
        "<style scoped>\n",
@@ -292,11 +291,14 @@
    },
    "outputs": [
     {
-     "output_type": "stream",
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Original RDD:\n('John', 28)\n('Smith', 44)\n('Adam', 65)\n('Henry', 23)\n"
+      "Original RDD:\n",
+      "('John', 28)\n",
+      "('Smith', 44)\n",
+      "('Adam', 65)\n",
+      "('Henry', 23)\n"
      ]
     }
    ],
@@ -328,11 +330,15 @@
    },
    "outputs": [
     {
-     "output_type": "stream",
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Original RDD ID: 316\nOriginal RDD ID After filter: 317\nTransformed RDD ID: 318\nFiltered RDD:\n('Smith', 44)\n('Adam', 65)\n"
+      "Original RDD ID: 316\n",
+      "Original RDD ID After filter: 317\n",
+      "Transformed RDD ID: 318\n",
+      "Filtered RDD:\n",
+      "('Smith', 44)\n",
+      "('Adam', 65)\n"
      ]
     }
    ],
@@ -371,7 +377,6 @@
    },
    "outputs": [
     {
-     "output_type": "display_data",
      "data": {
       "text/html": [
        "<style scoped>\n",
@@ -470,7 +475,6 @@
    },
    "outputs": [
     {
-     "output_type": "display_data",
      "data": {
       "text/html": [
        "<style scoped>\n",
@@ -582,6 +586,9 @@
    },
    "notebookName": "22-spark-immutablility-example",
    "widgets": {}
+  },
+  "jupytext": {
+   "formats": "ipynb,md"
   }
  },
  "nbformat": 4,