diff --git a/build.gradle b/build.gradle index b61140999a82f8..f4fb7b42d8560b 100644 --- a/build.gradle +++ b/build.gradle @@ -54,7 +54,7 @@ buildscript { ext.hazelcastVersion = '5.3.6' ext.ebeanVersion = '12.16.1' ext.googleJavaFormatVersion = '1.18.1' - ext.openLineageVersion = '1.5.0' + ext.openLineageVersion = '1.13.1' ext.logbackClassicJava8 = '1.2.12' ext.docker_registry = 'acryldata' diff --git a/docs-website/filterTagIndexes.json b/docs-website/filterTagIndexes.json index 64cb734e6d984c..0c1f541cf53d34 100644 --- a/docs-website/filterTagIndexes.json +++ b/docs-website/filterTagIndexes.json @@ -77,6 +77,17 @@ "Features": "" } }, + { + "Path": "docs/lineage/dagster", + "imgPath": "img/logos/platforms/dagster.svg", + "Title": "Dagster", + "Description": "Dagster is a next-generation open source orchestration platform for the development, production, and observation of data assets..", + "tags": { + "Platform Type": "Orchestrator", + "Connection Type": "Pull", + "Features": "Stateful Ingestion, UI Ingestion, Status Aspect" + } + }, { "Path": "docs/generated/ingestion/sources/databricks", "imgPath": "img/logos/platforms/databricks.png", @@ -433,7 +444,7 @@ "Path": "docs/generated/ingestion/sources/hive-metastore", "imgPath": "img/logos/platforms/presto.svg", "Title": "Hive Metastore", - "Description": "Presto on Hive is a data tool that allows users to query and analyze large datasets stored in Hive using SQL-like syntax.", + "Description": "Hive Metastore (HMS) is a service that stores metadata that is related to Hive, Presto, Trino and other services in a backend Relational Database Management System (RDBMS) ", "tags": { "Platform Type": "Datastore", "Connection Type": "Pull", @@ -551,7 +562,7 @@ } }, { - "Path": "docs/metadata-integration/java/spark-lineage", + "Path": "docs/metadata-integration/java/spark-lineage-beta", "imgPath": "img/logos/platforms/spark.svg", "Title": "Spark", "Description": "Spark is a data processing tool that enables fast and efficient processing of large-scale data sets using distributed computing.", diff --git a/docs-website/sidebars.js b/docs-website/sidebars.js index 865b37c961a717..f26853a488b62a 100644 --- a/docs-website/sidebars.js +++ b/docs-website/sidebars.js @@ -317,6 +317,11 @@ module.exports = { id: "docs/lineage/dagster", label: "Dagster", }, + { + type: "doc", + id: "docs/lineage/openlineage", + label: "OpenLineage", + }, { type: "doc", id: "metadata-integration/java/spark-lineage/README", diff --git a/docs-website/static/img/logos/platforms/dagster.svg b/docs-website/static/img/logos/platforms/dagster.svg new file mode 100644 index 00000000000000..d2ae628553a7dd --- /dev/null +++ b/docs-website/static/img/logos/platforms/dagster.svg @@ -0,0 +1,11 @@ + + + + + + + + + + + diff --git a/docs/lineage/openlineage.md b/docs/lineage/openlineage.md new file mode 100644 index 00000000000000..0b9423bf2c4da7 --- /dev/null +++ b/docs/lineage/openlineage.md @@ -0,0 +1,92 @@ +# OpenLineage + +DataHub, now supports [OpenLineage](https://openlineage.io/) integration. With this support, DataHub can ingest and display lineage information from various data processing frameworks, providing users with a comprehensive understanding of their data pipelines. + +## Features + +- **REST Endpoint Support**: DataHub now includes a REST endpoint that can understand OpenLineage events. This allows users to send lineage information directly to DataHub, enabling easy integration with various data processing frameworks. 
- **[Spark Event Listener Plugin](https://datahubproject.io/docs/metadata-integration/java/spark-lineage-beta)**: DataHub provides a Spark Event Listener plugin that seamlessly integrates with OpenLineage's Spark plugin. This plugin enhances DataHub's OpenLineage support by offering additional features such as PathSpec support, column-level lineage, patch support, and more.
+
+## OpenLineage Support with DataHub
+
+### 1. REST Endpoint Support
+
+DataHub's REST endpoint allows users to send OpenLineage events directly to DataHub. This enables easy integration with various data processing frameworks and provides users with a centralized location for viewing and managing data lineage information.
+
+For Spark and Airflow, we recommend using the Spark Lineage plugin or DataHub's Airflow plugin for tighter integration with DataHub.
+
+#### How to Use
+
+To send OpenLineage messages to DataHub using the REST endpoint, make a POST request to the following endpoint:
+
+```
+POST GMS_SERVER_HOST:GMS_PORT/api/v2/lineage
+```
+
+Include the OpenLineage message in the request body in JSON format.
+
+Example:
+
+```json
+{
+  "eventType": "START",
+  "eventTime": "2020-12-28T19:52:00.001+10:00",
+  "run": {
+    "runId": "d46e465b-d358-4d32-83d4-df660ff614dd"
+  },
+  "job": {
+    "namespace": "workshop",
+    "name": "process_taxes"
+  },
+  "inputs": [
+    {
+      "namespace": "postgres://workshop-db:None",
+      "name": "workshop.public.taxes",
+      "facets": {
+        "dataSource": {
+          "_producer": "https://github.com/OpenLineage/OpenLineage/tree/0.10.0/integration/airflow",
+          "_schemaURL": "https://raw.githubusercontent.com/OpenLineage/OpenLineage/main/spec/OpenLineage.json#/definitions/DataSourceDatasetFacet",
+          "name": "postgres://workshop-db:None",
+          "uri": "workshop-db"
+        }
+      }
+    }
+  ],
+  "producer": "https://github.com/OpenLineage/OpenLineage/blob/v1-0-0/client"
+}
+```
+
+##### How to set up Airflow
+
+Follow the Airflow guide to set up your Airflow DAGs to send lineage information to DataHub. The guide can be found [here](https://airflow.apache.org/docs/apache-airflow-providers-openlineage/stable/guides/user.html).
+The OpenLineage transport configuration should look like this:
+
+```json
+{
+  "type": "http",
+  "url": "https://GMS_SERVER_HOST:GMS_PORT/openapi/openlineage/",
+  "endpoint": "api/v1/lineage",
+  "auth": {
+    "type": "api_key",
+    "api_key": "your-datahub-api-key"
+  }
+}
+```
+
+#### Known Limitations
+
+For Spark and Airflow, the Spark Lineage plugin and DataHub's Airflow plugin remain the recommended options because they integrate more tightly with DataHub.
+
+- **[PathSpec](https://datahubproject.io/docs/metadata-integration/java/spark-lineage-beta/#configuring-hdfs-based-dataset-urns) Support**: While the REST endpoint accepts OpenLineage messages, full [PathSpec](https://datahubproject.io/docs/metadata-integration/java/spark-lineage-beta/#configuring-hdfs-based-dataset-urns) support is not yet available.
+
+- **Column-level Lineage**: DataHub's current OpenLineage support does not provide full column-level lineage tracking.
+
+- **Other Features**: Additional features offered by the Spark Event Listener plugin, such as patch support, are not available through the plain REST endpoint.
+
+### 2. Spark Event Listener Plugin
+
+DataHub's Spark Event Listener plugin enhances OpenLineage support by providing additional features such as PathSpec support, column-level lineage, and more.
+
+#### How to Use
+
+Follow the guides on the Spark Lineage plugin page for more information on how to set up the plugin; a minimal configuration sketch follows below.
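+
+As a quick orientation (not a substitute for the full guide), a minimal PySpark session configuration might look like the sketch below. The property names and values are taken from the plugin README elsewhere in this PR; the agent version, GMS URL, and token are placeholders that depend on your environment.
+
+```python
+from pyspark.sql import SparkSession
+
+spark = (
+    SparkSession.builder
+    .appName("test-application")
+    # Pull the DataHub Spark lineage agent (version is a placeholder; check the plugin README)
+    .config("spark.jars.packages", "io.acryl:acryl-spark-lineage:0.2.3")
+    # Register the DataHub listener so OpenLineage events are converted and emitted to DataHub
+    .config("spark.extraListeners", "datahub.spark.DatahubSparkListener")
+    # DataHub GMS endpoint (and, if needed, an access token) -- placeholders for your deployment
+    .config("spark.datahub.rest.server", "http://localhost:8080")
+    # .config("spark.datahub.rest.token", "<your-datahub-token>")
+    .getOrCreate()
+)
+```
+
+For the full set of configuration options (platform instance, coalescing, patch support, retries, and so on), refer to the plugin documentation.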
The guide can be found [here](https://datahubproject.io/docs/metadata-integration/java/spark-lineage-beta) + +## References + +- [OpenLineage](https://openlineage.io/) +- [DataHub OpenAPI Guide](../api/openapi/openapi-usage-guide.md) +- [DataHub Spark Lineage Plugin](https://datahubproject.io/docs/metadata-integration/java/spark-lineage-beta) diff --git a/metadata-integration/java/datahub-client/build.gradle b/metadata-integration/java/datahub-client/build.gradle index eee84b1f8c8274..2328697632434b 100644 --- a/metadata-integration/java/datahub-client/build.gradle +++ b/metadata-integration/java/datahub-client/build.gradle @@ -27,7 +27,7 @@ dependencies { } } - compileOnly externalDependency.httpAsyncClient + compileOnly externalDependency.httpClient implementation externalDependency.jacksonDataBind runtimeOnly externalDependency.jna @@ -41,7 +41,7 @@ dependencies { testImplementation externalDependency.mockServer testImplementation externalDependency.mockServerClient testImplementation externalDependency.testContainers - testImplementation externalDependency.httpAsyncClient + testImplementation externalDependency.httpClient testRuntimeOnly externalDependency.logbackClassic } diff --git a/metadata-integration/java/datahub-client/src/main/java/datahub/client/MetadataResponseFuture.java b/metadata-integration/java/datahub-client/src/main/java/datahub/client/MetadataResponseFuture.java index 89db9738efda69..11be10186f1ef3 100644 --- a/metadata-integration/java/datahub-client/src/main/java/datahub/client/MetadataResponseFuture.java +++ b/metadata-integration/java/datahub-client/src/main/java/datahub/client/MetadataResponseFuture.java @@ -7,16 +7,16 @@ import java.util.concurrent.TimeoutException; import java.util.concurrent.atomic.AtomicReference; import lombok.SneakyThrows; -import org.apache.http.HttpResponse; +import org.apache.hc.client5.http.async.methods.SimpleHttpResponse; public class MetadataResponseFuture implements Future { - private final Future requestFuture; + private final Future requestFuture; private final AtomicReference responseReference; private final CountDownLatch responseLatch; private final ResponseMapper mapper; public MetadataResponseFuture( - Future underlyingFuture, + Future underlyingFuture, AtomicReference responseAtomicReference, CountDownLatch responseLatch) { this.requestFuture = underlyingFuture; @@ -25,7 +25,8 @@ public MetadataResponseFuture( this.mapper = null; } - public MetadataResponseFuture(Future underlyingFuture, ResponseMapper mapper) { + public MetadataResponseFuture( + Future underlyingFuture, ResponseMapper mapper) { this.requestFuture = underlyingFuture; this.responseReference = null; this.responseLatch = null; @@ -50,7 +51,7 @@ public boolean isDone() { @SneakyThrows @Override public MetadataWriteResponse get() throws InterruptedException, ExecutionException { - HttpResponse response = requestFuture.get(); + SimpleHttpResponse response = requestFuture.get(); if (mapper != null) { return mapper.map(response); } else { @@ -63,7 +64,7 @@ public MetadataWriteResponse get() throws InterruptedException, ExecutionExcepti @Override public MetadataWriteResponse get(long timeout, TimeUnit unit) throws InterruptedException, ExecutionException, TimeoutException { - HttpResponse response = requestFuture.get(timeout, unit); + SimpleHttpResponse response = requestFuture.get(timeout, unit); if (mapper != null) { return mapper.map(response); } else { @@ -75,6 +76,6 @@ public MetadataWriteResponse get(long timeout, TimeUnit unit) @FunctionalInterface public 
interface ResponseMapper { - MetadataWriteResponse map(HttpResponse httpResponse); + MetadataWriteResponse map(SimpleHttpResponse httpResponse); } } diff --git a/metadata-integration/java/datahub-client/src/main/java/datahub/client/rest/DatahubHttpRequestRetryStrategy.java b/metadata-integration/java/datahub-client/src/main/java/datahub/client/rest/DatahubHttpRequestRetryStrategy.java new file mode 100644 index 00000000000000..71a4b93baf48f4 --- /dev/null +++ b/metadata-integration/java/datahub-client/src/main/java/datahub/client/rest/DatahubHttpRequestRetryStrategy.java @@ -0,0 +1,54 @@ +package datahub.client.rest; + +import java.io.IOException; +import java.io.InterruptedIOException; +import java.net.ConnectException; +import java.net.NoRouteToHostException; +import java.net.UnknownHostException; +import java.util.Arrays; +import javax.net.ssl.SSLException; +import lombok.extern.slf4j.Slf4j; +import org.apache.hc.client5.http.impl.DefaultHttpRequestRetryStrategy; +import org.apache.hc.core5.http.ConnectionClosedException; +import org.apache.hc.core5.http.HttpRequest; +import org.apache.hc.core5.http.HttpResponse; +import org.apache.hc.core5.http.HttpStatus; +import org.apache.hc.core5.http.protocol.HttpContext; +import org.apache.hc.core5.util.TimeValue; + +@Slf4j +public class DatahubHttpRequestRetryStrategy extends DefaultHttpRequestRetryStrategy { + public DatahubHttpRequestRetryStrategy() { + this(1, TimeValue.ofSeconds(10)); + } + + public DatahubHttpRequestRetryStrategy(int maxRetries, TimeValue retryInterval) { + super( + maxRetries, + retryInterval, + Arrays.asList( + InterruptedIOException.class, + UnknownHostException.class, + ConnectException.class, + ConnectionClosedException.class, + NoRouteToHostException.class, + SSLException.class), + Arrays.asList( + HttpStatus.SC_TOO_MANY_REQUESTS, + HttpStatus.SC_SERVICE_UNAVAILABLE, + HttpStatus.SC_INTERNAL_SERVER_ERROR)); + } + + @Override + public boolean retryRequest( + HttpRequest request, IOException exception, int execCount, HttpContext context) { + log.warn("Checking if retry is needed: {}", execCount); + return super.retryRequest(request, exception, execCount, context); + } + + @Override + public boolean retryRequest(HttpResponse response, int execCount, HttpContext context) { + log.warn("Retrying request due to error: {}", response); + return super.retryRequest(response, execCount, context); + } +} diff --git a/metadata-integration/java/datahub-client/src/main/java/datahub/client/rest/RestEmitter.java b/metadata-integration/java/datahub-client/src/main/java/datahub/client/rest/RestEmitter.java index a2692c432513e0..ed4cee060bd699 100644 --- a/metadata-integration/java/datahub-client/src/main/java/datahub/client/rest/RestEmitter.java +++ b/metadata-integration/java/datahub-client/src/main/java/datahub/client/rest/RestEmitter.java @@ -18,31 +18,35 @@ import datahub.event.UpsertAspectRequest; import java.io.ByteArrayOutputStream; import java.io.IOException; -import java.io.InputStream; import java.security.KeyManagementException; import java.security.KeyStoreException; import java.security.NoSuchAlgorithmException; import java.util.List; +import java.util.Objects; import java.util.concurrent.CountDownLatch; import java.util.concurrent.ExecutionException; import java.util.concurrent.Future; import java.util.concurrent.atomic.AtomicReference; import java.util.function.Consumer; import javax.annotation.concurrent.ThreadSafe; +import javax.net.ssl.SSLContext; import lombok.extern.slf4j.Slf4j; -import org.apache.http.HttpResponse; 
-import org.apache.http.HttpStatus; -import org.apache.http.client.config.RequestConfig; -import org.apache.http.client.methods.HttpGet; -import org.apache.http.client.methods.HttpPost; -import org.apache.http.concurrent.FutureCallback; -import org.apache.http.conn.ssl.NoopHostnameVerifier; -import org.apache.http.conn.ssl.TrustAllStrategy; -import org.apache.http.entity.StringEntity; -import org.apache.http.impl.nio.client.CloseableHttpAsyncClient; -import org.apache.http.impl.nio.client.HttpAsyncClientBuilder; -import org.apache.http.nio.client.HttpAsyncClient; -import org.apache.http.ssl.SSLContextBuilder; +import org.apache.hc.client5.http.async.methods.SimpleHttpRequest; +import org.apache.hc.client5.http.async.methods.SimpleHttpResponse; +import org.apache.hc.client5.http.async.methods.SimpleRequestBuilder; +import org.apache.hc.client5.http.config.RequestConfig; +import org.apache.hc.client5.http.impl.async.CloseableHttpAsyncClient; +import org.apache.hc.client5.http.impl.async.HttpAsyncClientBuilder; +import org.apache.hc.client5.http.impl.nio.PoolingAsyncClientConnectionManagerBuilder; +import org.apache.hc.client5.http.ssl.ClientTlsStrategyBuilder; +import org.apache.hc.client5.http.ssl.NoopHostnameVerifier; +import org.apache.hc.client5.http.ssl.TrustAllStrategy; +import org.apache.hc.core5.concurrent.FutureCallback; +import org.apache.hc.core5.http.ContentType; +import org.apache.hc.core5.http.HttpStatus; +import org.apache.hc.core5.http.nio.ssl.TlsStrategy; +import org.apache.hc.core5.ssl.SSLContexts; +import org.apache.hc.core5.util.TimeValue; @ThreadSafe @Slf4j @@ -89,28 +93,43 @@ public RestEmitter(RestEmitterConfig config) { dataTemplateCodec = new JacksonDataTemplateCodec(objectMapper.getFactory()); this.config = config; + HttpAsyncClientBuilder httpClientBuilder = this.config.getAsyncHttpClientBuilder(); + httpClientBuilder.setRetryStrategy(new DatahubHttpRequestRetryStrategy()); + // Override httpClient settings with RestEmitter configs if present if (config.getTimeoutSec() != null) { - HttpAsyncClientBuilder httpClientBuilder = this.config.getAsyncHttpClientBuilder(); httpClientBuilder.setDefaultRequestConfig( RequestConfig.custom() - .setConnectTimeout(config.getTimeoutSec() * 1000) - .setSocketTimeout(config.getTimeoutSec() * 1000) + .setConnectionRequestTimeout( + config.getTimeoutSec() * 1000, java.util.concurrent.TimeUnit.MILLISECONDS) + .setResponseTimeout( + config.getTimeoutSec() * 1000, java.util.concurrent.TimeUnit.MILLISECONDS) .build()); } if (config.isDisableSslVerification()) { - HttpAsyncClientBuilder httpClientBuilder = this.config.getAsyncHttpClientBuilder(); try { - httpClientBuilder - .setSSLContext( - new SSLContextBuilder().loadTrustMaterial(null, TrustAllStrategy.INSTANCE).build()) - .setSSLHostnameVerifier(NoopHostnameVerifier.INSTANCE); + SSLContext sslcontext = + SSLContexts.custom().loadTrustMaterial(TrustAllStrategy.INSTANCE).build(); + TlsStrategy tlsStrategy = + ClientTlsStrategyBuilder.create() + .setSslContext(sslcontext) + .setHostnameVerifier(NoopHostnameVerifier.INSTANCE) + .build(); + + httpClientBuilder.setConnectionManager( + PoolingAsyncClientConnectionManagerBuilder.create() + .setTlsStrategy(tlsStrategy) + .build()); } catch (KeyManagementException | NoSuchAlgorithmException | KeyStoreException e) { throw new RuntimeException("Error while creating insecure http client", e); } } - this.httpClient = this.config.getAsyncHttpClientBuilder().build(); + httpClientBuilder.setRetryStrategy( + new DatahubHttpRequestRetryStrategy( + 
config.getMaxRetries(), TimeValue.ofSeconds(config.getRetryIntervalSec()))); + + this.httpClient = httpClientBuilder.build(); this.httpClient.start(); this.ingestProposalUrl = this.config.getServer() + "/aspects?action=ingestProposal"; this.ingestOpenApiUrl = config.getServer() + "/openapi/entities/v1/"; @@ -118,13 +137,11 @@ public RestEmitter(RestEmitterConfig config) { this.eventFormatter = this.config.getEventFormatter(); } - private static MetadataWriteResponse mapResponse(HttpResponse response) { + private static MetadataWriteResponse mapResponse(SimpleHttpResponse response) { MetadataWriteResponse.MetadataWriteResponseBuilder builder = MetadataWriteResponse.builder().underlyingResponse(response); - if ((response != null) - && (response.getStatusLine() != null) - && (response.getStatusLine().getStatusCode() == HttpStatus.SC_OK - || response.getStatusLine().getStatusCode() == HttpStatus.SC_CREATED)) { + if ((response != null) && (response.getCode()) == HttpStatus.SC_OK + || Objects.requireNonNull(response).getCode() == HttpStatus.SC_CREATED) { builder.success(true); } else { builder.success(false); @@ -132,14 +149,7 @@ private static MetadataWriteResponse mapResponse(HttpResponse response) { // Read response content try { ByteArrayOutputStream result = new ByteArrayOutputStream(); - InputStream contentStream = response.getEntity().getContent(); - byte[] buffer = new byte[1024]; - int length = contentStream.read(buffer); - while (length > 0) { - result.write(buffer, 0, length); - length = contentStream.read(buffer); - } - builder.responseContent(result.toString("UTF-8")); + builder.responseContent(response.getBody().getBodyText()); } catch (Exception e) { // Catch all exceptions and still return a valid response object log.warn("Wasn't able to convert response into a string", e); @@ -198,21 +208,22 @@ public Future emit(MetadataChangeProposal mcp, Callback c private Future postGeneric( String urlStr, String payloadJson, Object originalRequest, Callback callback) throws IOException { - HttpPost httpPost = new HttpPost(urlStr); - httpPost.setHeader("Content-Type", "application/json"); - httpPost.setHeader("X-RestLi-Protocol-Version", "2.0.0"); - httpPost.setHeader("Accept", "application/json"); - this.config.getExtraHeaders().forEach((k, v) -> httpPost.setHeader(k, v)); + SimpleRequestBuilder simpleRequestBuilder = SimpleRequestBuilder.post(urlStr); + simpleRequestBuilder.setHeader("Content-Type", "application/json"); + simpleRequestBuilder.setHeader("X-RestLi-Protocol-Version", "2.0.0"); + simpleRequestBuilder.setHeader("Accept", "application/json"); + this.config.getExtraHeaders().forEach(simpleRequestBuilder::setHeader); if (this.config.getToken() != null) { - httpPost.setHeader("Authorization", "Bearer " + this.config.getToken()); + simpleRequestBuilder.setHeader("Authorization", "Bearer " + this.config.getToken()); } - httpPost.setEntity(new StringEntity(payloadJson)); + + simpleRequestBuilder.setBody(payloadJson, ContentType.APPLICATION_JSON); AtomicReference responseAtomicReference = new AtomicReference<>(); CountDownLatch responseLatch = new CountDownLatch(1); - FutureCallback httpCallback = - new FutureCallback() { + FutureCallback httpCallback = + new FutureCallback() { @Override - public void completed(HttpResponse response) { + public void completed(SimpleHttpResponse response) { MetadataWriteResponse writeResponse = null; try { writeResponse = mapResponse(response); @@ -252,16 +263,20 @@ public void cancelled() { } } }; - Future requestFuture = httpClient.execute(httpPost, 
httpCallback); + Future requestFuture = + httpClient.execute(simpleRequestBuilder.build(), httpCallback); return new MetadataResponseFuture(requestFuture, responseAtomicReference, responseLatch); } private Future getGeneric(String urlStr) throws IOException { - HttpGet httpGet = new HttpGet(urlStr); - httpGet.setHeader("Content-Type", "application/json"); - httpGet.setHeader("X-RestLi-Protocol-Version", "2.0.0"); - httpGet.setHeader("Accept", "application/json"); - Future response = this.httpClient.execute(httpGet, null); + SimpleHttpRequest simpleHttpRequest = + SimpleRequestBuilder.get(urlStr) + .addHeader("Content-Type", "application/json") + .addHeader("X-RestLi-Protocol-Version", "2.0.0") + .addHeader("Accept", "application/json") + .build(); + + Future response = this.httpClient.execute(simpleHttpRequest, null); return new MetadataResponseFuture(response, RestEmitter::mapResponse); } @@ -284,20 +299,25 @@ public Future emit(List request, Cal private Future postOpenAPI( List payload, Callback callback) throws IOException { - HttpPost httpPost = new HttpPost(ingestOpenApiUrl); - httpPost.setHeader("Content-Type", "application/json"); - httpPost.setHeader("Accept", "application/json"); - this.config.getExtraHeaders().forEach((k, v) -> httpPost.setHeader(k, v)); + SimpleRequestBuilder simpleRequestBuilder = + SimpleRequestBuilder.post(ingestOpenApiUrl) + .addHeader("Content-Type", "application/json") + .addHeader("Accept", "application/json") + .addHeader("X-RestLi-Protocol-Version", "2.0.0"); + + this.config.getExtraHeaders().forEach(simpleRequestBuilder::addHeader); + if (this.config.getToken() != null) { - httpPost.setHeader("Authorization", "Bearer " + this.config.getToken()); + simpleRequestBuilder.addHeader("Authorization", "Bearer " + this.config.getToken()); } - httpPost.setEntity(new StringEntity(objectMapper.writeValueAsString(payload))); + simpleRequestBuilder.setBody( + objectMapper.writeValueAsString(payload), ContentType.APPLICATION_JSON); AtomicReference responseAtomicReference = new AtomicReference<>(); CountDownLatch responseLatch = new CountDownLatch(1); - FutureCallback httpCallback = - new FutureCallback() { + FutureCallback httpCallback = + new FutureCallback() { @Override - public void completed(HttpResponse response) { + public void completed(SimpleHttpResponse response) { MetadataWriteResponse writeResponse = null; try { writeResponse = mapResponse(response); @@ -337,12 +357,13 @@ public void cancelled() { } } }; - Future requestFuture = httpClient.execute(httpPost, httpCallback); + Future requestFuture = + httpClient.execute(simpleRequestBuilder.build(), httpCallback); return new MetadataResponseFuture(requestFuture, responseAtomicReference, responseLatch); } @VisibleForTesting - HttpAsyncClient getHttpClient() { + CloseableHttpAsyncClient getHttpClient() { return this.httpClient; } } diff --git a/metadata-integration/java/datahub-client/src/main/java/datahub/client/rest/RestEmitterConfig.java b/metadata-integration/java/datahub-client/src/main/java/datahub/client/rest/RestEmitterConfig.java index 7e244292132468..e28ad4ed660f0b 100644 --- a/metadata-integration/java/datahub-client/src/main/java/datahub/client/rest/RestEmitterConfig.java +++ b/metadata-integration/java/datahub-client/src/main/java/datahub/client/rest/RestEmitterConfig.java @@ -10,8 +10,10 @@ import lombok.NonNull; import lombok.Value; import lombok.extern.slf4j.Slf4j; -import org.apache.http.client.config.RequestConfig; -import org.apache.http.impl.nio.client.HttpAsyncClientBuilder; +import 
org.apache.hc.client5.http.config.RequestConfig; +import org.apache.hc.client5.http.impl.async.HttpAsyncClientBuilder; +import org.apache.hc.client5.http.impl.async.HttpAsyncClients; +import org.apache.hc.core5.util.TimeValue; @Value @Builder @@ -23,20 +25,23 @@ public class RestEmitterConfig { public static final String DEFAULT_AUTH_TOKEN = null; public static final String CLIENT_VERSION_PROPERTY = "clientVersion"; - @Builder.Default private final String server = "http://localhost:8080"; + @Builder.Default String server = "http://localhost:8080"; - private final Integer timeoutSec; - @Builder.Default private final boolean disableSslVerification = false; + Integer timeoutSec; + @Builder.Default boolean disableSslVerification = false; - @Builder.Default private final String token = DEFAULT_AUTH_TOKEN; + @Builder.Default int maxRetries = 0; - @Builder.Default @NonNull private final Map extraHeaders = Collections.EMPTY_MAP; + @Builder.Default int retryIntervalSec = 10; - private final HttpAsyncClientBuilder asyncHttpClientBuilder; + @Builder.Default String token = DEFAULT_AUTH_TOKEN; + + @Builder.Default @NonNull Map extraHeaders = Collections.EMPTY_MAP; @Builder.Default - private final EventFormatter eventFormatter = - new EventFormatter(EventFormatter.Format.PEGASUS_JSON); + EventFormatter eventFormatter = new EventFormatter(EventFormatter.Format.PEGASUS_JSON); + + HttpAsyncClientBuilder asyncHttpClientBuilder; public static class RestEmitterConfigBuilder { @@ -53,13 +58,19 @@ private String getVersion() { } private HttpAsyncClientBuilder asyncHttpClientBuilder = - HttpAsyncClientBuilder.create() + HttpAsyncClients.custom() + .setUserAgent("DataHub-RestClient/" + getVersion()) .setDefaultRequestConfig( RequestConfig.custom() - .setConnectTimeout(DEFAULT_CONNECT_TIMEOUT_SEC * 1000) - .setSocketTimeout(DEFAULT_READ_TIMEOUT_SEC * 1000) + .setConnectionRequestTimeout( + DEFAULT_CONNECT_TIMEOUT_SEC * 1000, + java.util.concurrent.TimeUnit.MILLISECONDS) + .setResponseTimeout( + DEFAULT_READ_TIMEOUT_SEC * 1000, java.util.concurrent.TimeUnit.MILLISECONDS) .build()) - .setUserAgent("DataHub-RestClient/" + getVersion()); + .setRetryStrategy( + new DatahubHttpRequestRetryStrategy( + maxRetries$value, TimeValue.ofSeconds(retryIntervalSec$value))); public RestEmitterConfigBuilder with(Consumer builderFunction) { builderFunction.accept(this); diff --git a/metadata-integration/java/datahub-client/src/test/java/datahub/client/rest/RestEmitterTest.java b/metadata-integration/java/datahub-client/src/test/java/datahub/client/rest/RestEmitterTest.java index 657669d19439ce..a22b2736e750df 100644 --- a/metadata-integration/java/datahub-client/src/test/java/datahub/client/rest/RestEmitterTest.java +++ b/metadata-integration/java/datahub-client/src/test/java/datahub/client/rest/RestEmitterTest.java @@ -11,8 +11,8 @@ import datahub.event.MetadataChangeProposalWrapper; import datahub.server.TestDataHubServer; import java.io.IOException; -import java.io.InputStream; import java.net.SocketTimeoutException; +import java.net.URI; import java.net.URISyntaxException; import java.nio.charset.StandardCharsets; import java.util.ArrayList; @@ -32,117 +32,148 @@ import java.util.concurrent.atomic.AtomicReference; import java.util.stream.Collectors; import javax.net.ssl.SSLHandshakeException; -import org.apache.http.HttpResponse; -import org.apache.http.client.methods.HttpGet; -import org.apache.http.client.methods.HttpPost; -import org.apache.http.concurrent.FutureCallback; -import 
org.apache.http.impl.nio.client.CloseableHttpAsyncClient; -import org.apache.http.impl.nio.client.HttpAsyncClientBuilder; +import org.apache.hc.client5.http.async.methods.SimpleHttpRequest; +import org.apache.hc.client5.http.async.methods.SimpleHttpResponse; +import org.apache.hc.core5.http.Method; import org.junit.Assert; -import org.junit.Before; import org.junit.Test; import org.junit.runner.RunWith; -import org.mockito.ArgumentCaptor; -import org.mockito.Captor; -import org.mockito.Mock; -import org.mockito.Mockito; import org.mockito.junit.MockitoJUnitRunner; import org.mockserver.matchers.Times; +import org.mockserver.model.HttpError; import org.mockserver.model.HttpRequest; +import org.mockserver.model.HttpResponse; +import org.mockserver.model.HttpStatusCode; import org.mockserver.model.RequestDefinition; +import org.mockserver.verify.VerificationTimes; @RunWith(MockitoJUnitRunner.class) public class RestEmitterTest { - @Mock HttpAsyncClientBuilder mockHttpClientFactory; - - @Mock CloseableHttpAsyncClient mockClient; - - @Captor ArgumentCaptor postArgumentCaptor; - - @Captor ArgumentCaptor callbackCaptor; + @Test + public void testPost() + throws URISyntaxException, IOException, ExecutionException, InterruptedException { + TestDataHubServer testDataHubServer = new TestDataHubServer(); + Integer port = testDataHubServer.getMockServer().getPort(); + RestEmitter emitter = RestEmitter.create(b -> b.server("http://localhost:" + port)); - @Before - public void setupMocks() { - Mockito.when(mockHttpClientFactory.build()).thenReturn(mockClient); + MetadataChangeProposalWrapper mcp = + getMetadataChangeProposalWrapper( + "Test Dataset", "urn:li:dataset:(urn:li:dataPlatform:hive,foo.bar,PROD)"); + Future future = emitter.emit(mcp, null); + MetadataWriteResponse response = future.get(); + String expectedContent = + "{\"proposal\":{\"aspectName\":\"datasetProperties\"," + + "\"entityUrn\":\"urn:li:dataset:(urn:li:dataPlatform:hive,foo.bar,PROD)\"," + + "\"entityType\":\"dataset\",\"changeType\":\"UPSERT\",\"aspect\":{\"contentType\":\"application/json\"" + + ",\"value\":\"{\\\"description\\\":\\\"Test Dataset\\\"}\"}}}"; + testDataHubServer + .getMockServer() + .verify( + request().withHeader("X-RestLi-Protocol-Version", "2.0.0").withBody(expectedContent)); } @Test - public void testPost() throws URISyntaxException, IOException { + public void testPostWithRetry() + throws URISyntaxException, IOException, ExecutionException, InterruptedException { + TestDataHubServer testDataHubServer = new TestDataHubServer(); + Integer port = testDataHubServer.getMockServer().getPort(); + RestEmitterConfig config = + RestEmitterConfig.builder() + .server("http://localhost:" + port) + .maxRetries(3) + .retryIntervalSec(1) + .build(); + RestEmitter emitter = new RestEmitter(config); - RestEmitter emitter = RestEmitter.create(b -> b.asyncHttpClientBuilder(mockHttpClientFactory)); MetadataChangeProposalWrapper mcp = getMetadataChangeProposalWrapper( "Test Dataset", "urn:li:dataset:(urn:li:dataPlatform:hive,foo.bar,PROD)"); - emitter.emit(mcp, null); - Mockito.verify(mockClient).execute(postArgumentCaptor.capture(), callbackCaptor.capture()); - FutureCallback callback = callbackCaptor.getValue(); - Assert.assertNotNull(callback); - HttpPost testPost = postArgumentCaptor.getValue(); - Assert.assertEquals("2.0.0", testPost.getFirstHeader("X-RestLi-Protocol-Version").getValue()); - InputStream is = testPost.getEntity().getContent(); - byte[] contentBytes = new byte[(int) testPost.getEntity().getContentLength()]; - 
is.read(contentBytes); - String contentString = new String(contentBytes, StandardCharsets.UTF_8); + Future future = emitter.emit(mcp, null); + MetadataWriteResponse response = future.get(); String expectedContent = "{\"proposal\":{\"aspectName\":\"datasetProperties\"," + "\"entityUrn\":\"urn:li:dataset:(urn:li:dataPlatform:hive,foo.bar,PROD)\"," + "\"entityType\":\"dataset\",\"changeType\":\"UPSERT\",\"aspect\":{\"contentType\":\"application/json\"" + ",\"value\":\"{\\\"description\\\":\\\"Test Dataset\\\"}\"}}}"; - Assert.assertEquals(expectedContent, contentString); + testDataHubServer + .getMockServer() + .verify( + request().withHeader("X-RestLi-Protocol-Version", "2.0.0").withBody(expectedContent), + VerificationTimes.exactly(1)) + .when( + request() + .withPath("/aspect") + .withHeader("X-RestLi-Protocol-Version", "2.0.0") + .withBody(expectedContent), + Times.exactly(4)) + .respond(HttpResponse.response().withStatusCode(500).withBody("exception")); } @Test public void testExceptions() throws URISyntaxException, IOException, ExecutionException, InterruptedException { - - RestEmitter emitter = RestEmitter.create($ -> $.asyncHttpClientBuilder(mockHttpClientFactory)); + TestDataHubServer testDataHubServer = new TestDataHubServer(); + Integer port = testDataHubServer.getMockServer().getPort(); + RestEmitter emitter = + RestEmitter.create( + b -> + b.server("http://localhost:" + port) + .extraHeaders(Collections.singletonMap("Test-Header", "Test-Value"))); MetadataChangeProposalWrapper mcp = - MetadataChangeProposalWrapper.create( - b -> - b.entityType("dataset") - .entityUrn("urn:li:dataset:(urn:li:dataPlatform:hive,foo.bar,PROD)") - .upsert() - .aspect(new DatasetProperties().setDescription("Test Dataset"))); - - Future mockFuture = Mockito.mock(Future.class); - Mockito.when(mockClient.execute(Mockito.any(), Mockito.any())).thenReturn(mockFuture); - Mockito.when(mockFuture.get()) - .thenThrow(new ExecutionException("Test execution exception", null)); + getMetadataChangeProposalWrapper( + "Test Dataset", "urn:li:dataset:(urn:li:dataPlatform:hive,foo.bar,PROD)"); + Future future = emitter.emit(mcp, null); + MetadataWriteResponse response = future.get(); + String expectedContent = + "{\"proposal\":{\"aspectName\":\"datasetProperties\"," + + "\"entityUrn\":\"urn:li:dataset:(urn:li:dataPlatform:hive,foo.bar,PROD)\"," + + "\"entityType\":\"dataset\",\"changeType\":\"UPSERT\",\"aspect\":{\"contentType\":\"application/json\"" + + ",\"value\":\"{\\\"description\\\":\\\"Test Dataset\\\"}\"}}}"; + testDataHubServer + .getMockServer() + .when(request(), Times.once()) + .error(HttpError.error().withDropConnection(true)); + try { emitter.emit(mcp, null).get(); Assert.fail("should not be here"); } catch (ExecutionException e) { - Assert.assertEquals(e.getMessage(), "Test execution exception"); + Assert.assertEquals( + e.getMessage(), + "org.apache.hc.core5.http.ConnectionClosedException: Connection closed by peer"); } } @Test - public void testExtraHeaders() throws Exception { + public void testExtraHeaders() + throws URISyntaxException, IOException, ExecutionException, InterruptedException { + TestDataHubServer testDataHubServer = new TestDataHubServer(); + Integer port = testDataHubServer.getMockServer().getPort(); RestEmitter emitter = RestEmitter.create( b -> - b.asyncHttpClientBuilder(mockHttpClientFactory) + b.server("http://localhost:" + port) .extraHeaders(Collections.singletonMap("Test-Header", "Test-Value"))); - MetadataChangeProposalWrapper mcpw = - MetadataChangeProposalWrapper.create( - b 
-> - b.entityType("dataset") - .entityUrn("urn:li:dataset:foo") - .upsert() - .aspect(new DatasetProperties())); - Future mockFuture = Mockito.mock(Future.class); - Mockito.when(mockClient.execute(Mockito.any(), Mockito.any())).thenReturn(mockFuture); - emitter.emit(mcpw, null); - Mockito.verify(mockClient).execute(postArgumentCaptor.capture(), callbackCaptor.capture()); - FutureCallback callback = callbackCaptor.getValue(); - Assert.assertNotNull(callback); - HttpPost testPost = postArgumentCaptor.getValue(); - // old headers are not modified - Assert.assertEquals("2.0.0", testPost.getFirstHeader("X-RestLi-Protocol-Version").getValue()); - // new headers are added - Assert.assertEquals("Test-Value", testPost.getFirstHeader("Test-Header").getValue()); + + MetadataChangeProposalWrapper mcp = + getMetadataChangeProposalWrapper( + "Test Dataset", "urn:li:dataset:(urn:li:dataPlatform:hive,foo.bar,PROD)"); + Future future = emitter.emit(mcp, null); + MetadataWriteResponse response = future.get(); + String expectedContent = + "{\"proposal\":{\"aspectName\":\"datasetProperties\"," + + "\"entityUrn\":\"urn:li:dataset:(urn:li:dataPlatform:hive,foo.bar,PROD)\"," + + "\"entityType\":\"dataset\",\"changeType\":\"UPSERT\",\"aspect\":{\"contentType\":\"application/json\"" + + ",\"value\":\"{\\\"description\\\":\\\"Test Dataset\\\"}\"}}}"; + testDataHubServer + .getMockServer() + .verify( + request() + .withHeader("Test-Header", "Test-Value") + .withHeader("X-RestLi-Protocol-Version", "2.0.0") + .withBody(expectedContent)); } @Test @@ -168,7 +199,7 @@ public void multithreadedTestExecutors() throws Exception { .withQueryStringParameter("action", "ingestProposal") .withHeader("Content-type", "application/json"), Times.unlimited()) - .respond(org.mockserver.model.HttpResponse.response().withStatusCode(200)); + .respond(HttpResponse.response().withStatusCode(200)); ExecutorService executor = Executors.newFixedThreadPool(10); ArrayList results = new ArrayList(); Random random = new Random(); @@ -476,26 +507,27 @@ public void testUserAgentHeader() throws IOException, ExecutionException, Interr @Test public void testDisableSslVerification() - throws IOException, InterruptedException, ExecutionException { + throws IOException, InterruptedException, ExecutionException, URISyntaxException { RestEmitter restEmitter = new RestEmitter(RestEmitterConfig.builder().disableSslVerification(true).build()); final String hostWithSsl = "https://self-signed.badssl.com"; - final HttpGet request = new HttpGet(hostWithSsl); + final SimpleHttpRequest request = SimpleHttpRequest.create(Method.GET, new URI(hostWithSsl)); - final HttpResponse response = restEmitter.getHttpClient().execute(request, null).get(); + final SimpleHttpResponse response = restEmitter.getHttpClient().execute(request, null).get(); restEmitter.close(); - Assert.assertEquals(200, response.getStatusLine().getStatusCode()); + Assert.assertEquals(HttpStatusCode.OK_200.code(), response.getCode()); } @Test public void testSslVerificationException() - throws IOException, InterruptedException, ExecutionException { + throws IOException, InterruptedException, ExecutionException, URISyntaxException { RestEmitter restEmitter = new RestEmitter(RestEmitterConfig.builder().disableSslVerification(false).build()); final String hostWithSsl = "https://self-signed.badssl.com"; - final HttpGet request = new HttpGet(hostWithSsl); + final SimpleHttpRequest request = SimpleHttpRequest.create(Method.GET, new URI(hostWithSsl)); + try { - HttpResponse response = 
restEmitter.getHttpClient().execute(request, null).get(); + SimpleHttpResponse response = restEmitter.getHttpClient().execute(request, null).get(); Assert.fail(); } catch (Exception e) { Assert.assertTrue(e instanceof ExecutionException); diff --git a/metadata-integration/java/datahub-event/build.gradle b/metadata-integration/java/datahub-event/build.gradle index a516b9d43da4b9..395065404d1db8 100644 --- a/metadata-integration/java/datahub-event/build.gradle +++ b/metadata-integration/java/datahub-event/build.gradle @@ -25,7 +25,7 @@ dependencies { testImplementation externalDependency.testng testImplementation externalDependency.mockito testImplementation externalDependency.testContainers - testImplementation externalDependency.httpAsyncClient + testImplementation externalDependency.httpClient testRuntimeOnly externalDependency.logbackClassicJava8 } diff --git a/metadata-integration/java/openlineage-converter/src/main/java/io/datahubproject/openlineage/converter/OpenLineageToDataHub.java b/metadata-integration/java/openlineage-converter/src/main/java/io/datahubproject/openlineage/converter/OpenLineageToDataHub.java index 038e8d33a97c44..59cac8719c303a 100644 --- a/metadata-integration/java/openlineage-converter/src/main/java/io/datahubproject/openlineage/converter/OpenLineageToDataHub.java +++ b/metadata-integration/java/openlineage-converter/src/main/java/io/datahubproject/openlineage/converter/OpenLineageToDataHub.java @@ -621,6 +621,11 @@ private static void processParentJob( private static void processJobInputs( DatahubJob datahubJob, OpenLineage.RunEvent event, DatahubOpenlineageConfig datahubConf) { + + if (event.getInputs() == null) { + return; + } + for (OpenLineage.InputDataset input : event.getInputs().stream() .filter(input -> input.getFacets() != null) @@ -646,6 +651,11 @@ private static void processJobInputs( private static void processJobOutputs( DatahubJob datahubJob, OpenLineage.RunEvent event, DatahubOpenlineageConfig datahubConf) { + + if (event.getOutputs() == null) { + return; + } + for (OpenLineage.OutputDataset output : event.getOutputs().stream() .filter(input -> input.getFacets() != null) diff --git a/metadata-integration/java/spark-lineage-beta/README.md b/metadata-integration/java/spark-lineage-beta/README.md index 6a520071ba7978..e09bc3938b6868 100644 --- a/metadata-integration/java/spark-lineage-beta/README.md +++ b/metadata-integration/java/spark-lineage-beta/README.md @@ -24,7 +24,7 @@ When running jobs using spark-submit, the agent needs to be configured in the co ```text #Configuring DataHub spark agent jar -spark.jars.packages io.acryl:acryl-spark-lineage:0.2.1 +spark.jars.packages io.acryl:acryl-spark-lineage:0.2.3 spark.extraListeners datahub.spark.DatahubSparkListener spark.datahub.rest.server http://localhost:8080 ``` @@ -32,7 +32,7 @@ spark.datahub.rest.server http://localhost:8080 ## spark-submit command line ```sh -spark-submit --packages io.acryl:acryl-spark-lineage:0.2.1 --conf "spark.extraListeners=datahub.spark.DatahubSparkListener" my_spark_job_to_run.py +spark-submit --packages io.acryl:acryl-spark-lineage:0.2.3 --conf "spark.extraListeners=datahub.spark.DatahubSparkListener" my_spark_job_to_run.py ``` ### Configuration Instructions: Amazon EMR @@ -41,7 +41,7 @@ Set the following spark-defaults configuration properties as it stated [here](https://docs.aws.amazon.com/emr/latest/ReleaseGuide/emr-spark-configure.html) ```text -spark.jars.packages io.acryl:acryl-spark-lineage:0.2.1 +spark.jars.packages io.acryl:acryl-spark-lineage:0.2.3 
spark.extraListeners datahub.spark.DatahubSparkListener spark.datahub.rest.server https://your_datahub_host/gms #If you have authentication set up then you also need to specify the Datahub access token @@ -56,7 +56,7 @@ When running interactive jobs from a notebook, the listener can be configured wh spark = SparkSession.builder .master("spark://spark-master:7077") .appName("test-application") -.config("spark.jars.packages", "io.acryl:acryl-spark-lineage:0.1.0") +.config("spark.jars.packages", "io.acryl:acryl-spark-lineage:0.2.3") .config("spark.extraListeners", "datahub.spark.DatahubSparkListener") .config("spark.datahub.rest.server", "http://localhost:8080") .enableHiveSupport() @@ -79,7 +79,7 @@ appName("test-application") config("spark.master","spark://spark-master:7077") . -config("spark.jars.packages","io.acryl:acryl-spark-lineage:0.2.1") +config("spark.jars.packages","io.acryl:acryl-spark-lineage:0.2.3") . config("spark.extraListeners","datahub.spark.DatahubSparkListener") @@ -164,6 +164,8 @@ information like tokens. | spark.datahub.rest.server | ✅ | | Datahub server url eg: | | spark.datahub.rest.token | | | Authentication token. | | spark.datahub.rest.disable_ssl_verification | | false | Disable SSL certificate validation. Caution: Only use this if you know what you are doing! | +| spark.datahub.rest.rest.max_retries | | 0 | Number of times a request retried if failed | +| spark.datahub.rest.rest.retry_interval | | 10 | Number of seconds to wait between retries | | spark.datahub.metadata.pipeline.platformInstance | | | Pipeline level platform instance | | spark.datahub.metadata.dataset.platformInstance | | | dataset level platform instance | | spark.datahub.metadata.dataset.env | | PROD | [Supported values](https://datahubproject.io/docs/graphql/enums#fabrictype). In all other cases, will fallback to PROD | @@ -180,7 +182,7 @@ information like tokens. | spark.datahub.tags | | | Comma separated list of tags to attach to the DataFlow | | spark.datahub.domains | | | Comma separated list of domain urns to attach to the DataFlow | | spark.datahub.stage_metadata_coalescing | | | Normally it coalesce and send metadata at the onApplicationEnd event which is never called on Databricsk. You should enable this on Databricks if you want coalesced run . | -| spark.datahub.patch.enabled | | | Set this to true to send lineage as a patch, which appends rather than overwrites existing Dataset lineage edges. By default it is enabled. +| spark.datahub.patch.enabled | | false | Set this to true to send lineage as a patch, which appends rather than overwrites existing Dataset lineage edges. By default it is enabled. 
| ## What to Expect: The Metadata Model diff --git a/metadata-integration/java/spark-lineage-beta/build.gradle b/metadata-integration/java/spark-lineage-beta/build.gradle index 4cd2ddfec3dfcf..d83753028d0b44 100644 --- a/metadata-integration/java/spark-lineage-beta/build.gradle +++ b/metadata-integration/java/spark-lineage-beta/build.gradle @@ -37,7 +37,7 @@ dependencies { provided(externalDependency.sparkSql) provided(externalDependency.sparkHive) implementation 'org.slf4j:slf4j-log4j12:2.0.7' - implementation externalDependency.httpAsyncClient + implementation externalDependency.httpClient implementation externalDependency.logbackClassicJava8 implementation externalDependency.typesafeConfig implementation externalDependency.commonsLang @@ -53,7 +53,7 @@ dependencies { implementation project(path: ':metadata-integration:java:openlineage-converter', configuration: 'shadow') //implementation "io.acryl:datahub-client:0.10.2" - implementation "io.openlineage:openlineage-spark:$openLineageVersion" + implementation "io.openlineage:openlineage-spark_2.12:$openLineageVersion" compileOnly "org.apache.iceberg:iceberg-spark3-runtime:0.12.1" compileOnly "org.apache.spark:spark-sql_2.12:3.1.3" @@ -123,7 +123,7 @@ shadowJar { relocate 'com.fasterxml.jackson', 'datahub.spark2.shaded.jackson' relocate 'org.slf4j', 'datahub.spark2.shaded.org.slf4j' // - relocate 'org.apache.http', 'io.acryl.shaded.http' + relocate 'org.apache.hc', 'io.acryl.shaded.http' relocate 'org.apache.commons.codec', 'datahub.spark2.shaded.o.a.c.codec' relocate 'org.apache.commons.compress', 'datahub.spark2.shaded.o.a.c.compress' relocate 'org.apache.commons.lang3', 'datahub.spark2.shaded.o.a.c.lang3' diff --git a/metadata-integration/java/spark-lineage-beta/src/main/java/datahub/spark/DatahubEventEmitter.java b/metadata-integration/java/spark-lineage-beta/src/main/java/datahub/spark/DatahubEventEmitter.java index 6b430c5c2ab262..1dc086e4af585d 100644 --- a/metadata-integration/java/spark-lineage-beta/src/main/java/datahub/spark/DatahubEventEmitter.java +++ b/metadata-integration/java/spark-lineage-beta/src/main/java/datahub/spark/DatahubEventEmitter.java @@ -23,8 +23,8 @@ import io.datahubproject.openlineage.dataset.DatahubJob; import io.openlineage.client.OpenLineage; import io.openlineage.client.OpenLineageClientUtils; -import io.openlineage.spark.agent.ArgumentParser; import io.openlineage.spark.agent.EventEmitter; +import io.openlineage.spark.api.SparkOpenLineageConfig; import java.io.IOException; import java.net.URISyntaxException; import java.time.Instant; @@ -44,7 +44,6 @@ import java.util.stream.Collectors; import java.util.stream.Stream; import lombok.extern.slf4j.Slf4j; -import org.apache.spark.SparkConf; import org.apache.spark.sql.streaming.StreamingQueryProgress; @Slf4j @@ -55,10 +54,11 @@ public class DatahubEventEmitter extends EventEmitter { private final Map schemaMap = new HashMap<>(); private SparkLineageConf datahubConf; - private EventFormatter eventFormatter = new EventFormatter(); + private final EventFormatter eventFormatter = new EventFormatter(); - public DatahubEventEmitter() throws URISyntaxException { - super(ArgumentParser.parse(new SparkConf())); + public DatahubEventEmitter(SparkOpenLineageConfig config, String applicationJobName) + throws URISyntaxException { + super(config, applicationJobName); } private Optional getEmitter() { @@ -167,7 +167,7 @@ public List generateCoalescedMcps() { List mcps = new ArrayList<>(); if (_datahubJobs.isEmpty()) { - log.warn("No lineage events to emit. 
Maybe the spark job finished premaraturely?"); + log.warn("No lineage events to emit. Maybe the spark job finished prematurely?"); return mcps; } diff --git a/metadata-integration/java/spark-lineage-beta/src/main/java/datahub/spark/DatahubSparkListener.java b/metadata-integration/java/spark-lineage-beta/src/main/java/datahub/spark/DatahubSparkListener.java index 060402723d1940..38de142c4dd171 100644 --- a/metadata-integration/java/spark-lineage-beta/src/main/java/datahub/spark/DatahubSparkListener.java +++ b/metadata-integration/java/spark-lineage-beta/src/main/java/datahub/spark/DatahubSparkListener.java @@ -1,6 +1,7 @@ package datahub.spark; import static datahub.spark.conf.SparkConfigParser.*; +import static io.openlineage.spark.agent.util.ScalaConversionUtils.*; import com.typesafe.config.Config; import com.typesafe.config.ConfigFactory; @@ -10,16 +11,33 @@ import datahub.spark.conf.SparkAppContext; import datahub.spark.conf.SparkConfigParser; import datahub.spark.conf.SparkLineageConf; +import io.micrometer.core.instrument.MeterRegistry; +import io.micrometer.core.instrument.Tag; +import io.micrometer.core.instrument.Tags; +import io.micrometer.core.instrument.composite.CompositeMeterRegistry; +import io.openlineage.client.OpenLineageConfig; +import io.openlineage.client.circuitBreaker.CircuitBreaker; +import io.openlineage.client.circuitBreaker.CircuitBreakerFactory; +import io.openlineage.client.circuitBreaker.NoOpCircuitBreaker; +import io.openlineage.client.metrics.MicrometerProvider; +import io.openlineage.spark.agent.ArgumentParser; import io.openlineage.spark.agent.OpenLineageSparkListener; +import io.openlineage.spark.agent.Versions; import io.openlineage.spark.agent.lifecycle.ContextFactory; +import io.openlineage.spark.agent.util.ScalaConversionUtils; +import io.openlineage.spark.api.SparkOpenLineageConfig; import java.net.URISyntaxException; import java.time.Instant; import java.util.HashMap; import java.util.Map; import java.util.Optional; import java.util.Properties; +import org.apache.spark.SparkConf; +import org.apache.spark.SparkContext; +import org.apache.spark.SparkContext$; import org.apache.spark.SparkEnv; import org.apache.spark.SparkEnv$; +import org.apache.spark.package$; import org.apache.spark.scheduler.SparkListener; import org.apache.spark.scheduler.SparkListenerApplicationEnd; import org.apache.spark.scheduler.SparkListenerApplicationStart; @@ -30,20 +48,28 @@ import org.apache.spark.sql.streaming.StreamingQueryListener; import org.slf4j.Logger; import org.slf4j.LoggerFactory; +import scala.Function0; +import scala.Option; public class DatahubSparkListener extends SparkListener { private static final Logger log = LoggerFactory.getLogger(DatahubSparkListener.class); private final Map batchLastUpdated = new HashMap(); private final OpenLineageSparkListener listener; - private final DatahubEventEmitter emitter; + private DatahubEventEmitter emitter; private Config datahubConf = ConfigFactory.empty(); private SparkAppContext appContext; + private static ContextFactory contextFactory; + private static CircuitBreaker circuitBreaker = new NoOpCircuitBreaker(); + private static final String sparkVersion = package$.MODULE$.SPARK_VERSION(); + + private final Function0> activeSparkContext = + ScalaConversionUtils.toScalaFn(SparkContext$.MODULE$::getActive); + + private static MeterRegistry meterRegistry; + private boolean isDisabled; public DatahubSparkListener() throws URISyntaxException { listener = new OpenLineageSparkListener(); - emitter = new 
DatahubEventEmitter(); - ContextFactory contextFactory = new ContextFactory(emitter); - OpenLineageSparkListener.init(contextFactory); } private static SparkAppContext getSparkAppContext( @@ -61,13 +87,14 @@ private static SparkAppContext getSparkAppContext( public void onApplicationStart(SparkListenerApplicationStart applicationStart) { long startTime = System.currentTimeMillis(); + initializeContextFactoryIfNotInitialized(); - log.debug("Application start called"); + log.info("Application start called"); this.appContext = getSparkAppContext(applicationStart); listener.onApplicationStart(applicationStart); long elapsedTime = System.currentTimeMillis() - startTime; - log.debug("onApplicationStart completed successfully in {} ms", elapsedTime); + log.info("onApplicationStart completed successfully in {} ms", elapsedTime); } public Optional initializeEmitter(Config sparkConf) { @@ -87,6 +114,17 @@ public Optional initializeEmitter(Config sparkConf) { boolean disableSslVerification = sparkConf.hasPath(SparkConfigParser.DISABLE_SSL_VERIFICATION_KEY) && sparkConf.getBoolean(SparkConfigParser.DISABLE_SSL_VERIFICATION_KEY); + + int retry_interval_in_sec = + sparkConf.hasPath(SparkConfigParser.RETRY_INTERVAL_IN_SEC) + ? sparkConf.getInt(SparkConfigParser.RETRY_INTERVAL_IN_SEC) + : 5; + + int max_retries = + sparkConf.hasPath(SparkConfigParser.MAX_RETRIES) + ? sparkConf.getInt(SparkConfigParser.MAX_RETRIES) + : 0; + log.info( "REST Emitter Configuration: GMS url {}{}", gmsUrl, @@ -94,14 +132,18 @@ public Optional initializeEmitter(Config sparkConf) { if (token != null) { log.info("REST Emitter Configuration: Token {}", "XXXXX"); } + if (disableSslVerification) { log.warn("REST Emitter Configuration: ssl verification will be disabled."); } + RestEmitterConfig restEmitterConf = RestEmitterConfig.builder() .server(gmsUrl) .token(token) .disableSslVerification(disableSslVerification) + .maxRetries(max_retries) + .retryIntervalSec(retry_interval_in_sec) .build(); return Optional.of(new RestDatahubEmitterConfig(restEmitterConf)); } else { @@ -145,7 +187,12 @@ public void onApplicationEnd(SparkListenerApplicationEnd applicationEnd) { if (datahubConf.hasPath(STREAMING_JOB) && (datahubConf.getBoolean(STREAMING_JOB))) { return; } - emitter.emitCoalesced(); + if (emitter != null) { + emitter.emitCoalesced(); + } else { + log.warn("Emitter is not initialized, unable to emit coalesced events"); + } + long elapsedTime = System.currentTimeMillis() - startTime; log.debug("onApplicationEnd completed successfully in {} ms", elapsedTime); } @@ -170,6 +217,8 @@ public void onJobEnd(SparkListenerJobEnd jobEnd) { public void onJobStart(SparkListenerJobStart jobStart) { long startTime = System.currentTimeMillis(); + initializeContextFactoryIfNotInitialized(); + log.debug("Job start called"); loadDatahubConfig(this.appContext, jobStart.properties()); listener.onJobStart(jobStart); @@ -227,4 +276,72 @@ public void onOtherEvent(SparkListenerEvent event) { log.debug("onOtherEvent completed successfully in {} ms", elapsedTime); } } + + private static void initializeMetrics(OpenLineageConfig openLineageConfig) { + meterRegistry = + MicrometerProvider.addMeterRegistryFromConfig(openLineageConfig.getMetricsConfig()); + String disabledFacets; + if (openLineageConfig.getFacetsConfig() != null + && openLineageConfig.getFacetsConfig().getDisabledFacets() != null) { + disabledFacets = String.join(";", openLineageConfig.getFacetsConfig().getDisabledFacets()); + } else { + disabledFacets = ""; + } + meterRegistry + .config() + 
.commonTags( + Tags.of( + Tag.of("openlineage.spark.integration.version", Versions.getVersion()), + Tag.of("openlineage.spark.version", sparkVersion), + Tag.of("openlineage.spark.disabled.facets", disabledFacets))); + ((CompositeMeterRegistry) meterRegistry) + .getRegistries() + .forEach( + r -> + r.config() + .commonTags( + Tags.of( + Tag.of("openlineage.spark.integration.version", Versions.getVersion()), + Tag.of("openlineage.spark.version", sparkVersion), + Tag.of("openlineage.spark.disabled.facets", disabledFacets)))); + } + + private void initializeContextFactoryIfNotInitialized() { + if (contextFactory != null || isDisabled) { + return; + } + asJavaOptional(activeSparkContext.apply()) + .ifPresent(context -> initializeContextFactoryIfNotInitialized(context.appName())); + } + + private void initializeContextFactoryIfNotInitialized(String appName) { + if (contextFactory != null || isDisabled) { + return; + } + SparkEnv sparkEnv = SparkEnv$.MODULE$.get(); + if (sparkEnv == null) { + log.warn( + "OpenLineage listener instantiated, but no configuration could be found. " + + "Lineage events will not be collected"); + return; + } + initializeContextFactoryIfNotInitialized(sparkEnv.conf(), appName); + } + + private void initializeContextFactoryIfNotInitialized(SparkConf sparkConf, String appName) { + if (contextFactory != null || isDisabled) { + return; + } + try { + SparkOpenLineageConfig config = ArgumentParser.parse(sparkConf); + // Needs to be done before initializing OpenLineageClient + initializeMetrics(config); + emitter = new DatahubEventEmitter(config, appName); + contextFactory = new ContextFactory(emitter, meterRegistry, config); + circuitBreaker = new CircuitBreakerFactory(config.getCircuitBreaker()).build(); + OpenLineageSparkListener.init(contextFactory); + } catch (URISyntaxException e) { + log.error("Unable to parse OpenLineage endpoint. 
Lineage events will not be collected", e); + } + } } diff --git a/metadata-integration/java/spark-lineage-beta/src/main/java/datahub/spark/conf/SparkConfigParser.java b/metadata-integration/java/spark-lineage-beta/src/main/java/datahub/spark/conf/SparkConfigParser.java index 7e10f51feb38a4..f1af56ff888d3c 100644 --- a/metadata-integration/java/spark-lineage-beta/src/main/java/datahub/spark/conf/SparkConfigParser.java +++ b/metadata-integration/java/spark-lineage-beta/src/main/java/datahub/spark/conf/SparkConfigParser.java @@ -29,6 +29,9 @@ public class SparkConfigParser { public static final String GMS_URL_KEY = "rest.server"; public static final String GMS_AUTH_TOKEN = "rest.token"; public static final String DISABLE_SSL_VERIFICATION_KEY = "rest.disable_ssl_verification"; + public static final String MAX_RETRIES = "rest.max_retries"; + public static final String RETRY_INTERVAL_IN_SEC = "rest.retry_interval_in_sec"; + public static final String COALESCE_KEY = "coalesce_jobs"; public static final String PATCH_ENABLED = "patch.enabled"; @@ -304,7 +307,7 @@ public static boolean isCoalesceEnabled(Config datahubConfig) { public static boolean isPatchEnabled(Config datahubConfig) { if (!datahubConfig.hasPath(PATCH_ENABLED)) { - return true; + return false; } return datahubConfig.hasPath(PATCH_ENABLED) && datahubConfig.getBoolean(PATCH_ENABLED); } diff --git a/metadata-integration/java/spark-lineage-beta/src/main/java/io/openlineage/spark/agent/lifecycle/OpenLineageRunEventBuilder.java b/metadata-integration/java/spark-lineage-beta/src/main/java/io/openlineage/spark/agent/lifecycle/OpenLineageRunEventBuilder.java deleted file mode 100644 index 99643592dc200e..00000000000000 --- a/metadata-integration/java/spark-lineage-beta/src/main/java/io/openlineage/spark/agent/lifecycle/OpenLineageRunEventBuilder.java +++ /dev/null @@ -1,493 +0,0 @@ -/* -/* Copyright 2018-2023 contributors to the OpenLineage project -/* SPDX-License-Identifier: Apache-2.0 -*/ - -package io.openlineage.spark.agent.lifecycle; - -import static io.openlineage.client.OpenLineageClientUtils.mergeFacets; -import static io.openlineage.spark.agent.util.ScalaConversionUtils.fromSeq; -import static io.openlineage.spark.agent.util.ScalaConversionUtils.toScalaFn; - -import io.openlineage.client.OpenLineage; -import io.openlineage.client.OpenLineage.DatasetFacet; -import io.openlineage.client.OpenLineage.DatasetFacets; -import io.openlineage.client.OpenLineage.InputDataset; -import io.openlineage.client.OpenLineage.InputDatasetFacet; -import io.openlineage.client.OpenLineage.InputDatasetInputFacets; -import io.openlineage.client.OpenLineage.JobBuilder; -import io.openlineage.client.OpenLineage.JobFacet; -import io.openlineage.client.OpenLineage.OutputDataset; -import io.openlineage.client.OpenLineage.OutputDatasetFacet; -import io.openlineage.client.OpenLineage.OutputDatasetOutputFacets; -import io.openlineage.client.OpenLineage.ParentRunFacet; -import io.openlineage.client.OpenLineage.RunEvent; -import io.openlineage.client.OpenLineage.RunEventBuilder; -import io.openlineage.client.OpenLineage.RunFacet; -import io.openlineage.client.OpenLineage.RunFacets; -import io.openlineage.client.OpenLineage.RunFacetsBuilder; -import io.openlineage.spark.agent.hooks.HookUtils; -import io.openlineage.spark.agent.lifecycle.plan.column.ColumnLevelLineageUtils; -import io.openlineage.spark.agent.lifecycle.plan.column.ColumnLevelLineageVisitor; -import io.openlineage.spark.agent.util.FacetUtils; -import io.openlineage.spark.agent.util.PlanUtils; -import 
io.openlineage.spark.agent.util.ScalaConversionUtils; -import io.openlineage.spark.api.CustomFacetBuilder; -import io.openlineage.spark.api.OpenLineageContext; -import io.openlineage.spark.api.OpenLineageEventHandlerFactory; -import java.util.ArrayList; -import java.util.Arrays; -import java.util.Collection; -import java.util.Collections; -import java.util.HashMap; -import java.util.List; -import java.util.Map; -import java.util.Optional; -import java.util.stream.Collectors; -import java.util.stream.Stream; -import lombok.AllArgsConstructor; -import lombok.NonNull; -import lombok.extern.slf4j.Slf4j; -import org.apache.spark.rdd.RDD; -import org.apache.spark.scheduler.ActiveJob; -import org.apache.spark.scheduler.JobFailed; -import org.apache.spark.scheduler.SparkListenerJobEnd; -import org.apache.spark.scheduler.SparkListenerJobStart; -import org.apache.spark.scheduler.SparkListenerStageCompleted; -import org.apache.spark.scheduler.SparkListenerStageSubmitted; -import org.apache.spark.scheduler.Stage; -import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan; -import org.apache.spark.sql.execution.ui.SparkListenerSQLExecutionEnd; -import org.apache.spark.sql.execution.ui.SparkListenerSQLExecutionStart; -import scala.Function1; -import scala.PartialFunction; - -/** - * Event handler that accepts various {@link org.apache.spark.scheduler.SparkListener} events and - * helps build up an {@link RunEvent} by passing event components to partial functions that know how - * to convert those event components into {@link RunEvent} properties. - * - *
The event types that can be consumed to generate {@link OpenLineage.RunEvent} properties have
- * no common supertype, so the generic argument for the function input is simply {@link Object}. The
- * types of arguments that may be found include
- *
- *   • {@link org.apache.spark.scheduler.StageInfo}
- *   • {@link Stage}
- *   • {@link RDD}
- *   • {@link ActiveJob}
- *   • {@link org.apache.spark.sql.execution.QueryExecution}
- *
These components are extracted from various {@link org.apache.spark.scheduler.SparkListener} - * events, such as {@link SparkListenerStageCompleted}, {@link SparkListenerJobStart}, and {@link - * org.apache.spark.scheduler.SparkListenerTaskEnd}. - * - *
{@link RDD} chains will be _flattened_ so each `RDD` dependency is passed to the builders one - * at a time. This means a builder can directly specify the type of {@link RDD} it handles, such as - * a {@link org.apache.spark.rdd.HadoopRDD} or a {@link - * org.apache.spark.sql.execution.datasources.FileScanRDD}, without having to check the dependencies - * of every {@link org.apache.spark.rdd.MapPartitionsRDD} or {@link - * org.apache.spark.sql.execution.SQLExecutionRDD}. - * - *
Any {@link RunFacet}s and {@link JobFacet}s returned by the {@link CustomFacetBuilder}s are - * appended to the {@link OpenLineage.Run} and {@link OpenLineage.Job}, respectively. - * - *
If any {@link OpenLineage.InputDatasetBuilder}s or {@link - * OpenLineage.OutputDatasetBuilder}s are returned from the partial functions, the {@link - * #inputDatasetBuilders} or {@link #outputDatasetBuilders} will be invoked using the same input - * arguments in order to construct any {@link InputDatasetFacet}s or {@link OutputDatasetFacet}s to - * the returned dataset. {@link InputDatasetFacet}s and {@link OutputDatasetFacet}s will be attached - * to any {@link OpenLineage.InputDatasetBuilder} or {@link OpenLineage.OutputDatasetBuilder} - * found for the event. This is because facets may be constructed from generic information that is - * not specifically tied to a Dataset. For example, {@link - * OpenLineage.OutputStatisticsOutputDatasetFacet}s are created from {@link - * org.apache.spark.executor.TaskMetrics} attached to the last {@link - * org.apache.spark.scheduler.StageInfo} for a given job execution. However, the {@link - * OutputDataset} is constructed by reading the {@link LogicalPlan}. There's no way to tie the - * output metrics in the {@link org.apache.spark.scheduler.StageInfo} to the {@link OutputDataset} - * in the {@link LogicalPlan} except by inference. Similarly, input metrics can be found in the - * {@link org.apache.spark.scheduler.StageInfo} for the stage that reads a dataset and the {@link - * InputDataset} can usually be constructed by walking the {@link RDD} dependency tree for that - * {@link Stage} and finding a {@link org.apache.spark.sql.execution.datasources.FileScanRDD} or - * other concrete implementation. But while there is typically only one {@link InputDataset} read in - * a given stage, there's no guarantee of that and the {@link org.apache.spark.executor.TaskMetrics} - * in the {@link org.apache.spark.scheduler.StageInfo} won't disambiguate. - * - *
If a facet needs to be attached to a specific dataset, the user must take care to construct - * both the Dataset and the Facet in the same builder. - */ -@Slf4j -@AllArgsConstructor -class OpenLineageRunEventBuilder { - - @NonNull private final OpenLineageContext openLineageContext; - - @NonNull - private final Collection>> inputDatasetBuilders; - - @NonNull - private final Collection>> - inputDatasetQueryPlanVisitors; - - @NonNull - private final Collection>> outputDatasetBuilders; - - @NonNull - private final Collection>> - outputDatasetQueryPlanVisitors; - - @NonNull - private final Collection> datasetFacetBuilders; - - @NonNull - private final Collection> - inputDatasetFacetBuilders; - - @NonNull - private final Collection> - outputDatasetFacetBuilders; - - @NonNull private final Collection> runFacetBuilders; - @NonNull private final Collection> jobFacetBuilders; - @NonNull private final Collection columnLineageVisitors; - private final UnknownEntryFacetListener unknownEntryFacetListener = - UnknownEntryFacetListener.getInstance(); - private final Map jobMap = new HashMap<>(); - private final Map stageMap = new HashMap<>(); - - OpenLineageRunEventBuilder(OpenLineageContext context, OpenLineageEventHandlerFactory factory) { - this( - context, - factory.createInputDatasetBuilder(context), - factory.createInputDatasetQueryPlanVisitors(context), - factory.createOutputDatasetBuilder(context), - factory.createOutputDatasetQueryPlanVisitors(context), - factory.createDatasetFacetBuilders(context), - factory.createInputDatasetFacetBuilders(context), - factory.createOutputDatasetFacetBuilders(context), - factory.createRunFacetBuilders(context), - factory.createJobFacetBuilders(context), - factory.createColumnLevelLineageVisitors(context)); - } - - /** - * Add an {@link ActiveJob} and all of its {@link Stage}s to the maps so we can look them up by id - * later. 
- * - * @param job - */ - void registerJob(ActiveJob job) { - jobMap.put(job.jobId(), job); - stageMap.put(job.finalStage().id(), job.finalStage()); - job.finalStage() - .parents() - .forall( - toScalaFn( - stage -> { - stageMap.put(stage.id(), stage); - return true; - })); - } - - RunEvent buildRun( - Optional parentRunFacet, - RunEventBuilder runEventBuilder, - JobBuilder jobBuilder, - SparkListenerStageSubmitted event) { - Stage stage = stageMap.get(event.stageInfo().stageId()); - RDD rdd = stage.rdd(); - - List nodes = new ArrayList<>(); - nodes.addAll(Arrays.asList(event.stageInfo(), stage)); - - nodes.addAll(Rdds.flattenRDDs(rdd)); - - return populateRun(parentRunFacet, runEventBuilder, jobBuilder, nodes); - } - - RunEvent buildRun( - Optional parentRunFacet, - RunEventBuilder runEventBuilder, - JobBuilder jobBuilder, - SparkListenerStageCompleted event) { - Stage stage = stageMap.get(event.stageInfo().stageId()); - RDD rdd = stage.rdd(); - - List nodes = new ArrayList<>(); - nodes.addAll(Arrays.asList(event.stageInfo(), stage)); - - nodes.addAll(Rdds.flattenRDDs(rdd)); - - return populateRun(parentRunFacet, runEventBuilder, jobBuilder, nodes); - } - - RunEvent buildRun( - Optional parentRunFacet, - RunEventBuilder runEventBuilder, - JobBuilder jobBuilder, - SparkListenerSQLExecutionStart event) { - runEventBuilder.eventType(RunEvent.EventType.START); - return buildRun(parentRunFacet, runEventBuilder, jobBuilder, event, Optional.empty()); - } - - RunEvent buildRun( - Optional parentRunFacet, - RunEventBuilder runEventBuilder, - JobBuilder jobBuilder, - SparkListenerSQLExecutionEnd event) { - runEventBuilder.eventType(RunEvent.EventType.COMPLETE); - return buildRun(parentRunFacet, runEventBuilder, jobBuilder, event, Optional.empty()); - } - - RunEvent buildRun( - Optional parentRunFacet, - RunEventBuilder runEventBuilder, - JobBuilder jobBuilder, - SparkListenerJobStart event) { - runEventBuilder.eventType(RunEvent.EventType.START); - return buildRun( - parentRunFacet, - runEventBuilder, - jobBuilder, - event, - Optional.ofNullable(jobMap.get(event.jobId()))); - } - - RunEvent buildRun( - Optional parentRunFacet, - RunEventBuilder runEventBuilder, - JobBuilder jobBuilder, - SparkListenerJobEnd event) { - runEventBuilder.eventType( - event.jobResult() instanceof JobFailed - ? 
RunEvent.EventType.FAIL - : RunEvent.EventType.COMPLETE); - return buildRun( - parentRunFacet, - runEventBuilder, - jobBuilder, - event, - Optional.ofNullable(jobMap.get(event.jobId()))); - } - - private RunEvent buildRun( - Optional parentRunFacet, - RunEventBuilder runEventBuilder, - JobBuilder jobBuilder, - Object event, - Optional job) { - List nodes = new ArrayList<>(); - nodes.add(event); - job.ifPresent( - j -> { - nodes.add(j); - nodes.addAll(Rdds.flattenRDDs(j.finalStage().rdd())); - }); - - return populateRun(parentRunFacet, runEventBuilder, jobBuilder, nodes); - } - - private RunEvent populateRun( - Optional parentRunFacet, - RunEventBuilder runEventBuilder, - JobBuilder jobBuilder, - List nodes) { - OpenLineage openLineage = openLineageContext.getOpenLineage(); - - RunFacetsBuilder runFacetsBuilder = openLineage.newRunFacetsBuilder(); - OpenLineage.JobFacetsBuilder jobFacetsBuilder = - openLineageContext.getOpenLineage().newJobFacetsBuilder(); - - parentRunFacet.ifPresent(runFacetsBuilder::parent); - OpenLineage.JobFacets jobFacets = buildJobFacets(nodes, jobFacetBuilders, jobFacetsBuilder); - List inputDatasets = buildInputDatasets(nodes); - List outputDatasets = buildOutputDatasets(nodes); - openLineageContext - .getQueryExecution() - .filter(qe -> !FacetUtils.isFacetDisabled(openLineageContext, "spark_unknown")) - .flatMap(qe -> unknownEntryFacetListener.build(qe.optimizedPlan())) - .ifPresent(facet -> runFacetsBuilder.put("spark_unknown", facet)); - - RunFacets runFacets = buildRunFacets(nodes, runFacetBuilders, runFacetsBuilder); - OpenLineage.RunBuilder runBuilder = - openLineage.newRunBuilder().runId(openLineageContext.getRunUuid()).facets(runFacets); - runEventBuilder - .run(runBuilder.build()) - .job(jobBuilder.facets(jobFacets).build()) - .inputs(inputDatasets) - .outputs(outputDatasets); - - HookUtils.preBuild(openLineageContext, runEventBuilder); - return runEventBuilder.build(); - } - - private List buildInputDatasets(List nodes) { - openLineageContext - .getQueryExecution() - .ifPresent( - qe -> { - if (log.isDebugEnabled()) { - log.debug("Traversing optimized plan {}", qe.optimizedPlan().toJSON()); - log.debug("Physical plan executed {}", qe.executedPlan().toJSON()); - } - }); - log.debug( - "Visiting query plan {} with input dataset builders {}", - openLineageContext.getQueryExecution(), - inputDatasetBuilders); - - Function1> inputVisitor = - visitLogicalPlan(PlanUtils.merge(inputDatasetQueryPlanVisitors)); - - List datasets = - Stream.concat( - buildDatasets(nodes, inputDatasetBuilders), - openLineageContext - .getQueryExecution() - .map( - qe -> - fromSeq(qe.optimizedPlan().map(inputVisitor)).stream() - .flatMap(Collection::stream) - .map(((Class) InputDataset.class)::cast)) - .orElse(Stream.empty())) - .collect(Collectors.toList()); - OpenLineage openLineage = openLineageContext.getOpenLineage(); - if (!datasets.isEmpty()) { - Map inputFacetsMap = new HashMap<>(); - nodes.forEach( - event -> inputDatasetFacetBuilders.forEach(fn -> fn.accept(event, inputFacetsMap::put))); - Map datasetFacetsMap = new HashMap<>(); - nodes.forEach( - event -> inputDatasetFacetBuilders.forEach(fn -> fn.accept(event, inputFacetsMap::put))); - return datasets.stream() - .map( - ds -> - openLineage - .newInputDatasetBuilder() - .name(ds.getName()) - .namespace(ds.getNamespace()) - .inputFacets( - mergeFacets( - inputFacetsMap, ds.getInputFacets(), InputDatasetInputFacets.class)) - .facets(mergeFacets(datasetFacetsMap, ds.getFacets(), DatasetFacets.class)) - .build()) - 
.collect(Collectors.toList()); - } - return datasets; - } - - /** - * Returns a {@link Function1} that passes the input {@link LogicalPlan} node to the {@link - * #unknownEntryFacetListener} if the inputVisitor is defined for the input node. - * - * @param inputVisitor - * @param - * @return - */ - private Function1> visitLogicalPlan( - PartialFunction> inputVisitor) { - return ScalaConversionUtils.toScalaFn( - node -> - inputVisitor - .andThen( - toScalaFn( - ds -> { - unknownEntryFacetListener.accept(node); - return ds; - })) - .applyOrElse(node, toScalaFn(n -> Collections.emptyList()))); - } - - private List buildOutputDatasets(List nodes) { - log.debug( - "Visiting query plan {} with output dataset builders {}", - openLineageContext.getQueryExecution(), - outputDatasetBuilders); - Function1> visitor = - visitLogicalPlan(PlanUtils.merge(outputDatasetQueryPlanVisitors)); - List datasets = - Stream.concat( - buildDatasets(nodes, outputDatasetBuilders), - openLineageContext - .getQueryExecution() - .map(qe -> visitor.apply(qe.optimizedPlan())) - .map(Collection::stream) - .orElse(Stream.empty())) - .collect(Collectors.toList()); - - OpenLineage openLineage = openLineageContext.getOpenLineage(); - - if (!datasets.isEmpty()) { - Map outputFacetsMap = new HashMap<>(); - nodes.forEach( - event -> - outputDatasetFacetBuilders.forEach(fn -> fn.accept(event, outputFacetsMap::put))); - Map datasetFacetsMap = new HashMap<>(); - nodes.forEach( - event -> datasetFacetBuilders.forEach(fn -> fn.accept(event, datasetFacetsMap::put))); - return datasets.stream() - .map( - ds -> { - Map dsFacetsMap = new HashMap(datasetFacetsMap); - ColumnLevelLineageUtils.buildColumnLineageDatasetFacet( - openLineageContext, ds.getFacets().getSchema()) - .ifPresent(facet -> dsFacetsMap.put("columnLineage", facet)); - return openLineage - .newOutputDatasetBuilder() - .name(ds.getName()) - .namespace(ds.getNamespace()) - .outputFacets( - mergeFacets( - outputFacetsMap, ds.getOutputFacets(), OutputDatasetOutputFacets.class)) - .facets(mergeFacets(dsFacetsMap, ds.getFacets(), DatasetFacets.class)) - .build(); - }) - .collect(Collectors.toList()); - } - return datasets; - } - - private Stream buildDatasets( - List nodes, Collection>> builders) { - return nodes.stream() - .flatMap( - event -> - builders.stream() - .filter(pfn -> PlanUtils.safeIsDefinedAt(pfn, event)) - .map(pfn -> PlanUtils.safeApply(pfn, event)) - .flatMap(Collection::stream)); - } - - /** - * Attach facets to a facet container, such as an {@link InputDatasetInputFacets} or an {@link - * OutputDatasetOutputFacets}. Facets returned by a {@link CustomFacetBuilder} may be attached to - * a field in the container, such as {@link InputDatasetInputFacets#dataQualityMetrics} or may be - * attached as a key/value pair in the {@link InputDatasetInputFacets#additionalProperties} map. - * The serialized JSON does not distinguish between these, but the java class does. The Java class - * also has some fields, such as the {@link InputDatasetInputFacets#producer} URI, which need to - * be included in the serialized JSON. - * - *
This methods will generate a new facet container with properties potentially overridden by - * the values set by the custom facet generators. - * - * @param events - * @param builders - * @return - */ - private OpenLineage.JobFacets buildJobFacets( - List events, - Collection> builders, - OpenLineage.JobFacetsBuilder jobFacetsBuilder) { - events.forEach(event -> builders.forEach(fn -> fn.accept(event, jobFacetsBuilder::put))); - return jobFacetsBuilder.build(); - } - - private RunFacets buildRunFacets( - List events, - Collection> builders, - RunFacetsBuilder runFacetsBuilder) { - events.forEach(event -> builders.forEach(fn -> fn.accept(event, runFacetsBuilder::put))); - return runFacetsBuilder.build(); - } -} diff --git a/metadata-integration/java/spark-lineage-beta/src/main/java/io/openlineage/spark/agent/lifecycle/plan/LogicalRelationDatasetBuilder.java b/metadata-integration/java/spark-lineage-beta/src/main/java/io/openlineage/spark/agent/lifecycle/plan/LogicalRelationDatasetBuilder.java deleted file mode 100644 index dd58b9eaf140b0..00000000000000 --- a/metadata-integration/java/spark-lineage-beta/src/main/java/io/openlineage/spark/agent/lifecycle/plan/LogicalRelationDatasetBuilder.java +++ /dev/null @@ -1,220 +0,0 @@ -/* -/* Copyright 2018-2023 contributors to the OpenLineage project -/* SPDX-License-Identifier: Apache-2.0 -*/ - -package io.openlineage.spark.agent.lifecycle.plan; - -import io.openlineage.client.OpenLineage; -import io.openlineage.client.OpenLineage.DatasetFacetsBuilder; -import io.openlineage.client.utils.DatasetIdentifier; -import io.openlineage.spark.agent.lifecycle.plan.handlers.JdbcRelationHandler; -import io.openlineage.spark.agent.util.PathUtils; -import io.openlineage.spark.agent.util.PlanUtils; -import io.openlineage.spark.api.AbstractQueryPlanDatasetBuilder; -import io.openlineage.spark.api.DatasetFactory; -import io.openlineage.spark.api.OpenLineageContext; -import java.util.ArrayList; -import java.util.Collection; -import java.util.Collections; -import java.util.List; -import java.util.Optional; -import java.util.stream.Collectors; -import lombok.extern.slf4j.Slf4j; -import org.apache.hadoop.conf.Configuration; -import org.apache.hadoop.fs.Path; -import org.apache.spark.scheduler.SparkListenerEvent; -import org.apache.spark.sql.catalyst.catalog.CatalogTable; -import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan; -import org.apache.spark.sql.execution.datasources.HadoopFsRelation; -import org.apache.spark.sql.execution.datasources.LogicalRelation; -import org.apache.spark.sql.execution.datasources.jdbc.JDBCOptions; -import org.apache.spark.sql.execution.datasources.jdbc.JDBCRelation; -import scala.collection.JavaConversions; - -/** - * {@link LogicalPlan} visitor that attempts to extract a {@link OpenLineage.Dataset} from a {@link - * LogicalRelation}. The {@link org.apache.spark.sql.sources.BaseRelation} is tested for known - * types, such as {@link HadoopFsRelation} or {@link JDBCRelation}s, as those are easy to extract - * exact dataset information. - * - *
For {@link HadoopFsRelation}s, it is assumed that a single directory maps to a single {@link - * OpenLineage.Dataset}. Any files referenced are replaced by their parent directory and all files - * in a given directory are assumed to belong to the same {@link OpenLineage.Dataset}. Directory - * partitioning is currently not addressed. - * - *
For {@link JDBCRelation}s, {@link OpenLineage.Dataset} naming expects the namespace to be the - * JDBC connection URL (schema and authority only) and the table name to be the - * <database> - * .<tableName>. - * - *
{@link CatalogTable}s, if present, can be used to describe the {@link OpenLineage.Dataset} if - * its {@link org.apache.spark.sql.sources.BaseRelation} is unknown. - * - *
TODO If a user specifies the {@link JDBCOptions#JDBC_QUERY_STRING()} option, we do not parse - * the sql to determine the specific tables used. Since we return a List of {@link - * OpenLineage.Dataset}s, we can parse the sql and determine each table referenced to return a - * complete list of datasets referenced. - */ -@Slf4j -public class LogicalRelationDatasetBuilder - extends AbstractQueryPlanDatasetBuilder { - - private final DatasetFactory datasetFactory; - - public LogicalRelationDatasetBuilder( - OpenLineageContext context, DatasetFactory datasetFactory, boolean searchDependencies) { - super(context, searchDependencies); - this.datasetFactory = datasetFactory; - } - - @Override - public boolean isDefinedAtLogicalPlan(LogicalPlan x) { - // if a LogicalPlan is a single node plan like `select * from temp`, - // then it's leaf node and should not be considered output node - if (x instanceof LogicalRelation && isSingleNodeLogicalPlan(x) && !searchDependencies) { - return false; - } - - return x instanceof LogicalRelation - && (((LogicalRelation) x).relation() instanceof HadoopFsRelation - || ((LogicalRelation) x).relation() instanceof JDBCRelation - || ((LogicalRelation) x).catalogTable().isDefined()); - } - - private boolean isSingleNodeLogicalPlan(LogicalPlan x) { - return context - .getQueryExecution() - .map(qe -> qe.optimizedPlan()) - .filter(p -> p.equals(x)) - .isPresent() - && (x.children() == null || x.children().isEmpty()); - } - - @Override - public List apply(LogicalRelation logRel) { - if (logRel.catalogTable() != null && logRel.catalogTable().isDefined()) { - return handleCatalogTable(logRel); - } else if (logRel.relation() instanceof HadoopFsRelation) { - return handleHadoopFsRelation(logRel); - } else if (logRel.relation() instanceof JDBCRelation) { - return new JdbcRelationHandler<>(datasetFactory).handleRelation(logRel); - } - throw new IllegalArgumentException( - "Expected logical plan to be either HadoopFsRelation, JDBCRelation, " - + "or CatalogTable but was " - + logRel); - } - - private List handleCatalogTable(LogicalRelation logRel) { - CatalogTable catalogTable = logRel.catalogTable().get(); - - DatasetIdentifier di = PathUtils.fromCatalogTable(catalogTable); - - OpenLineage.DatasetFacetsBuilder datasetFacetsBuilder = - context.getOpenLineage().newDatasetFacetsBuilder(); - datasetFacetsBuilder.schema(PlanUtils.schemaFacet(context.getOpenLineage(), logRel.schema())); - datasetFacetsBuilder.dataSource( - PlanUtils.datasourceFacet(context.getOpenLineage(), di.getNamespace())); - - getDatasetVersion(logRel) - .map( - version -> - datasetFacetsBuilder.version( - context.getOpenLineage().newDatasetVersionDatasetFacet(version))); - - return Collections.singletonList(datasetFactory.getDataset(di, datasetFacetsBuilder)); - } - - private List handleHadoopFsRelation(LogicalRelation x) { - HadoopFsRelation relation = (HadoopFsRelation) x.relation(); - try { - return context - .getSparkSession() - .map( - session -> { - Configuration hadoopConfig = - session.sessionState().newHadoopConfWithOptions(relation.options()); - - DatasetFacetsBuilder datasetFacetsBuilder = - context.getOpenLineage().newDatasetFacetsBuilder(); - getDatasetVersion(x) - .map( - version -> - datasetFacetsBuilder.version( - context.getOpenLineage().newDatasetVersionDatasetFacet(version))); - - Collection rootPaths = - JavaConversions.asJavaCollection(relation.location().rootPaths()); - - if (isSingleFileRelation(rootPaths, hadoopConfig)) { - return Collections.singletonList( - datasetFactory.getDataset( - 
rootPaths.stream().findFirst().get().toUri(), - relation.schema(), - datasetFacetsBuilder)); - } else { - return rootPaths.stream() - .map(p -> PlanUtils.getDirectoryPath(p, hadoopConfig)) - .distinct() - .map( - p -> { - // TODO- refactor this to return a single partitioned dataset based on - // static - // static partitions in the relation - return datasetFactory.getDataset( - p.toUri(), relation.schema(), datasetFacetsBuilder); - }) - .collect(Collectors.toList()); - } - }) - .orElse(Collections.emptyList()); - } catch (Exception e) { - if ("com.databricks.backend.daemon.data.client.adl.AzureCredentialNotFoundExcepgittion" - .equals(e.getClass().getName())) { - // This is a fallback that can occur when hadoop configurations cannot be - // reached. This occurs in Azure Databricks when credential passthrough - // is enabled and you're attempting to get the data lake credentials. - // The Spark Listener context cannot use the user credentials - // thus we need a fallback. - // This is similar to the InsertIntoHadoopRelationVisitor's process for getting - // Datasets - List inputDatasets = new ArrayList(); - List paths = - new ArrayList<>(JavaConversions.asJavaCollection(relation.location().rootPaths())); - for (Path p : paths) { - inputDatasets.add(datasetFactory.getDataset(p.toUri(), relation.schema())); - } - if (inputDatasets.isEmpty()) { - return Collections.emptyList(); - } else { - return inputDatasets; - } - } else { - throw e; - } - } - } - - private boolean isSingleFileRelation(Collection paths, Configuration hadoopConfig) { - if (paths.size() != 1) { - return false; - } - - try { - Path path = paths.stream().findFirst().get(); - return path.getFileSystem(hadoopConfig).isFile(path); - /* - Unfortunately it seems like on DataBricks this can throw an SparkException as well if credentials are missing. - Like org.apache.spark.SparkException: There is no Credential Scope. 
- */ - } catch (Exception e) { - return false; - } - } - - protected Optional getDatasetVersion(LogicalRelation x) { - // not implemented - return Optional.empty(); - } -} diff --git a/metadata-integration/java/spark-lineage-beta/src/main/java/io/openlineage/spark/agent/util/PathUtils.java b/metadata-integration/java/spark-lineage-beta/src/main/java/io/openlineage/spark/agent/util/PathUtils.java deleted file mode 100644 index b72d28ce72dd90..00000000000000 --- a/metadata-integration/java/spark-lineage-beta/src/main/java/io/openlineage/spark/agent/util/PathUtils.java +++ /dev/null @@ -1,207 +0,0 @@ -/* -/* Copyright 2018-2023 contributors to the OpenLineage project -/* SPDX-License-Identifier: Apache-2.0 -*/ - -package io.openlineage.spark.agent.util; - -import com.typesafe.config.Config; -import com.typesafe.config.ConfigFactory; -import datahub.spark.conf.SparkAppContext; -import datahub.spark.conf.SparkConfigParser; -import io.datahubproject.openlineage.config.DatahubOpenlineageConfig; -import io.datahubproject.openlineage.dataset.HdfsPathDataset; -import io.openlineage.client.utils.DatasetIdentifier; -import io.openlineage.client.utils.DatasetIdentifierUtils; -import java.io.File; -import java.net.URI; -import java.net.URISyntaxException; -import java.util.Arrays; -import java.util.Optional; -import java.util.stream.Collectors; -import lombok.SneakyThrows; -import lombok.extern.slf4j.Slf4j; -import org.apache.commons.lang.StringUtils; -import org.apache.hadoop.fs.Path; -import org.apache.spark.SparkConf; -import org.apache.spark.sql.SparkSession; -import org.apache.spark.sql.catalyst.TableIdentifier; -import org.apache.spark.sql.catalyst.catalog.CatalogTable; -import org.apache.spark.sql.internal.StaticSQLConf; - -@Slf4j -@SuppressWarnings("checkstyle:HideUtilityClassConstructor") -public class PathUtils { - - private static final String DEFAULT_SCHEME = "file"; - public static final String SPARK_OPENLINEAGE_DATASET_REMOVE_PATH_PATTERN = - "spark.openlineage.dataset.removePath.pattern"; - public static final String REMOVE_PATTERN_GROUP = "remove"; - - private static Optional sparkConf = Optional.empty(); - - public static DatasetIdentifier fromPath(Path path) { - return fromPath(path, DEFAULT_SCHEME); - } - - public static DatasetIdentifier fromPath(Path path, String defaultScheme) { - return fromURI(path.toUri(), defaultScheme); - } - - public static DatasetIdentifier fromURI(URI location) { - return fromURI(location, DEFAULT_SCHEME); - } - - public static DatasetIdentifier fromURI(URI location, String defaultScheme) { - DatasetIdentifier di = DatasetIdentifierUtils.fromURI(location, defaultScheme); - return new DatasetIdentifier(removePathPattern(di.getName()), di.getNamespace()); - } - - public static DatasetIdentifier fromCatalogTable(CatalogTable catalogTable) { - return fromCatalogTable(catalogTable, loadSparkConf()); - } - - /** - * Create DatasetIdentifier from CatalogTable, using storage's locationURI if it exists. In other - * way, use defaultTablePath. 
- */ - @SneakyThrows - public static DatasetIdentifier fromCatalogTable( - CatalogTable catalogTable, Optional sparkConf) { - - DatasetIdentifier di; - if (catalogTable.storage() != null && catalogTable.storage().locationUri().isDefined()) { - di = PathUtils.fromURI(catalogTable.storage().locationUri().get(), DEFAULT_SCHEME); - } else { - // try to obtain location - try { - di = prepareDatasetIdentifierFromDefaultTablePath(catalogTable); - } catch (IllegalStateException e) { - // session inactive - no way to find DatasetProvider - throw new IllegalArgumentException( - "Unable to extract DatasetIdentifier from a CatalogTable", e); - } - } - - Optional metastoreUri = extractMetastoreUri(sparkConf); - // TODO: Is the call to "metastoreUri.get()" really needed? - // Java's Optional should prevent the null in the first place. - if (metastoreUri.isPresent() && metastoreUri.get() != null) { - // dealing with Hive tables - DatasetIdentifier symlink = prepareHiveDatasetIdentifier(catalogTable, metastoreUri.get()); - return di.withSymlink( - symlink.getName(), symlink.getNamespace(), DatasetIdentifier.SymlinkType.TABLE); - } else { - return di.withSymlink( - nameFromTableIdentifier(catalogTable.identifier()), - StringUtils.substringBeforeLast(di.getName(), File.separator), - DatasetIdentifier.SymlinkType.TABLE); - } - } - - @SneakyThrows - private static DatasetIdentifier prepareDatasetIdentifierFromDefaultTablePath( - CatalogTable catalogTable) { - URI uri = - SparkSession.active().sessionState().catalog().defaultTablePath(catalogTable.identifier()); - - return PathUtils.fromURI(uri); - } - - @SneakyThrows - private static DatasetIdentifier prepareHiveDatasetIdentifier( - CatalogTable catalogTable, URI metastoreUri) { - String qualifiedName = nameFromTableIdentifier(catalogTable.identifier()); - if (!qualifiedName.startsWith("/")) { - qualifiedName = String.format("/%s", qualifiedName); - } - return PathUtils.fromPath( - new Path(enrichHiveMetastoreURIWithTableName(metastoreUri, qualifiedName))); - } - - @SneakyThrows - public static URI enrichHiveMetastoreURIWithTableName(URI metastoreUri, String qualifiedName) { - return new URI( - "hive", null, metastoreUri.getHost(), metastoreUri.getPort(), qualifiedName, null, null); - } - - /** - * SparkConf does not change through job lifetime but it can get lost once session is closed. 
It's - * good to have it set in case of SPARK-29046 - */ - private static Optional loadSparkConf() { - if (!sparkConf.isPresent() && SparkSession.getDefaultSession().isDefined()) { - sparkConf = Optional.of(SparkSession.getDefaultSession().get().sparkContext().getConf()); - } - return sparkConf; - } - - private static Optional extractMetastoreUri(Optional sparkConf) { - // make sure SparkConf is present - if (!sparkConf.isPresent()) { - return Optional.empty(); - } - - // make sure enableHiveSupport is called - Optional setting = - SparkConfUtils.findSparkConfigKey( - sparkConf.get(), StaticSQLConf.CATALOG_IMPLEMENTATION().key()); - if (!setting.isPresent() || !"hive".equals(setting.get())) { - return Optional.empty(); - } - - return SparkConfUtils.getMetastoreUri(sparkConf.get()); - } - - private static String removeFirstSlashIfSingleSlashInString(String name) { - if (name.chars().filter(x -> x == '/').count() == 1 && name.startsWith("/")) { - return name.substring(1); - } - return name; - } - - private static String removePathPattern(String datasetName) { - // TODO: The reliance on global-mutable state here should be changed - // this led to problems in the PathUtilsTest class, where some tests interfered with others - log.info("Removing path pattern from dataset name {}", datasetName); - Optional conf = loadSparkConf(); - if (!conf.isPresent()) { - return datasetName; - } - try { - String propertiesString = - Arrays.stream(conf.get().getAllWithPrefix("spark.datahub.")) - .map(tup -> tup._1 + "= \"" + tup._2 + "\"") - .collect(Collectors.joining("\n")); - Config datahubConfig = ConfigFactory.parseString(propertiesString); - DatahubOpenlineageConfig datahubOpenlineageConfig = - SparkConfigParser.sparkConfigToDatahubOpenlineageConf( - datahubConfig, new SparkAppContext()); - HdfsPathDataset hdfsPath = - HdfsPathDataset.create(new URI(datasetName), datahubOpenlineageConfig); - log.debug("Transformed path is {}", hdfsPath.getDatasetPath()); - return hdfsPath.getDatasetPath(); - } catch (InstantiationException e) { - log.warn( - "Unable to convert dataset {} to path the exception was {}", datasetName, e.getMessage()); - return datasetName; - } catch (URISyntaxException e) { - throw new RuntimeException(e); - } - } - - private static String nameFromTableIdentifier(TableIdentifier identifier) { - // we create name instead of calling `unquotedString` method which includes spark_catalog - // for Spark 3.4 - String name; - if (identifier.database().isDefined()) { - // include database in name - name = String.format("%s.%s", identifier.database().get(), identifier.table()); - } else { - // just table name - name = identifier.table(); - } - - return name; - } -} diff --git a/metadata-integration/java/spark-lineage-beta/src/main/java/io/openlineage/spark/agent/util/PlanUtils.java b/metadata-integration/java/spark-lineage-beta/src/main/java/io/openlineage/spark/agent/util/PlanUtils.java index 8d93b0288b5151..d46d741d155b8b 100644 --- a/metadata-integration/java/spark-lineage-beta/src/main/java/io/openlineage/spark/agent/util/PlanUtils.java +++ b/metadata-integration/java/spark-lineage-beta/src/main/java/io/openlineage/spark/agent/util/PlanUtils.java @@ -1,16 +1,19 @@ /* -/* Copyright 2018-2023 contributors to the OpenLineage project +/* Copyright 2018-2024 contributors to the OpenLineage project /* SPDX-License-Identifier: Apache-2.0 */ package io.openlineage.spark.agent.util; +import static io.openlineage.spark.agent.lifecycle.ExecutionContext.CAMEL_TO_SNAKE_CASE; + import com.typesafe.config.Config; 
import com.typesafe.config.ConfigFactory; import datahub.spark.conf.SparkLineageConf; import io.datahubproject.openlineage.dataset.HdfsPathDataset; import io.openlineage.client.OpenLineage; import io.openlineage.spark.agent.Versions; +import java.io.IOException; import java.net.URI; import java.net.URISyntaxException; import java.util.ArrayList; @@ -18,71 +21,44 @@ import java.util.Collection; import java.util.Collections; import java.util.List; +import java.util.Locale; import java.util.Objects; import java.util.Optional; import java.util.UUID; import java.util.stream.Collectors; -import java.util.stream.Stream; import lombok.extern.slf4j.Slf4j; import org.apache.hadoop.conf.Configuration; import org.apache.hadoop.fs.Path; -import org.apache.hadoop.mapred.FileInputFormat; import org.apache.spark.SparkConf; import org.apache.spark.SparkEnv; -import org.apache.spark.package$; -import org.apache.spark.rdd.HadoopRDD; import org.apache.spark.rdd.RDD; import org.apache.spark.sql.catalyst.expressions.Attribute; -import org.apache.spark.sql.execution.datasources.FileScanRDD; import org.apache.spark.sql.types.StructField; import org.apache.spark.sql.types.StructType; import scala.PartialFunction; -import scala.runtime.AbstractPartialFunction; +import scala.PartialFunction$; /** * Utility functions for traversing a {@link * org.apache.spark.sql.catalyst.plans.logical.LogicalPlan}. */ @Slf4j -@SuppressWarnings("checkstyle:HideUtilityClassConstructor") public class PlanUtils { - - public static final String SLASH_DELIMITER_USER_PASSWORD_REGEX = - "[A-Za-z0-9_%]+//?[A-Za-z0-9_%]*@"; - public static final String COLON_DELIMITER_USER_PASSWORD_REGEX = - "([/|,])[A-Za-z0-9_%]+:?[A-Za-z0-9_%]*@"; - - /** - * Merge a list of {@link PartialFunction}s and return the first value where the function is - * defined or empty list if no function matches the input. - * - * @param fns - * @param arg - * @param - * @param - * @return - */ - public static Collection applyAll( - List>> fns, T arg) { - PartialFunction> fn = merge(fns); - if (fn.isDefinedAt(arg)) { - return fn.apply(arg); - } - return Collections.emptyList(); - } - /** * Given a list of {@link PartialFunction}s merge to produce a single function that will test the - * input against each function one by one until a match is found or empty() is returned. + * input against each function one by one until a match is found or {@link + * PartialFunction$#empty()} is returned. 
* * @param fns * @param * @param * @return */ - public static PartialFunction> merge( + public static OpenLineageAbstractPartialFunction> merge( Collection>> fns) { - return new AbstractPartialFunction>() { + return new OpenLineageAbstractPartialFunction>() { + String appliedClassName; + @Override public boolean isDefinedAt(T x) { return fns.stream() @@ -110,6 +86,7 @@ public Collection apply(T x) { x.getClass().getCanonicalName(), collection); } + appliedClassName = x.getClass().getName(); return collection; } catch (RuntimeException | NoClassDefFoundError | NoSuchMethodError e) { log.error("Apply failed:", e); @@ -120,6 +97,11 @@ public Collection apply(T x) { .flatMap(Collection::stream) .collect(Collectors.toList()); } + + @Override + String appliedName() { + return appliedClassName; + } }; } @@ -204,12 +186,26 @@ public static OpenLineage.ParentRunFacet parentRunFacet( .run(new OpenLineage.ParentRunFacetRunBuilder().runId(parentRunId).build()) .job( new OpenLineage.ParentRunFacetJobBuilder() - .name(parentJob) + .name(parentJob.replaceAll(CAMEL_TO_SNAKE_CASE, "_$1").toLowerCase(Locale.ROOT)) .namespace(parentJobNamespace) .build()) .build(); } + public static Path getDirectoryPathOl(Path p, Configuration hadoopConf) { + try { + if (p.getFileSystem(hadoopConf).getFileStatus(p).isFile()) { + return p.getParent(); + } else { + return p; + } + } catch (IOException e) { + log.warn("Unable to get file system for path ", e); + return p; + } + } + + // This method was replaced to support Datahub PathSpecs public static Path getDirectoryPath(Path p, Configuration hadoopConf) { SparkConf conf = SparkEnv.get().conf(); String propertiesString = @@ -229,17 +225,6 @@ public static Path getDirectoryPath(Path p, Configuration hadoopConf) { log.warn("Unable to convert path to hdfs path {} the exception was {}", p, e.getMessage()); return p; } - - // try { - // if (p.getFileSystem(hadoopConf).getFileStatus(p).isFile()) { - // return p.getParent(); - // } else { - // return p; - // } - // } catch (IOException e) { - // log.warn("Unable to get file system for path ", e); - // return p; - // } } /** @@ -251,36 +236,7 @@ public static Path getDirectoryPath(Path p, Configuration hadoopConf) { */ public static List findRDDPaths(List> fileRdds) { return fileRdds.stream() - .flatMap( - rdd -> { - if (rdd instanceof HadoopRDD) { - HadoopRDD hadoopRDD = (HadoopRDD) rdd; - Path[] inputPaths = FileInputFormat.getInputPaths(hadoopRDD.getJobConf()); - Configuration hadoopConf = hadoopRDD.getConf(); - return Arrays.stream(inputPaths) - .map(p -> PlanUtils.getDirectoryPath(p, hadoopConf)); - } else if (rdd instanceof FileScanRDD) { - FileScanRDD fileScanRDD = (FileScanRDD) rdd; - return ScalaConversionUtils.fromSeq(fileScanRDD.filePartitions()).stream() - .flatMap(fp -> Arrays.stream(fp.files())) - .map( - f -> { - if (package$.MODULE$.SPARK_VERSION().compareTo("3.4") > 0) { - // filePath returns SparkPath for Spark 3.4 - return ReflectionUtils.tryExecuteMethod(f, "filePath") - .map(o -> ReflectionUtils.tryExecuteMethod(o, "toPath")) - .map(o -> (Path) o.get()) - .get() - .getParent(); - } else { - return new Path(f.filePath()).getParent(); - } - }); - } else { - log.warn("Unknown RDD class {}", rdd.getClass().getCanonicalName()); - return Stream.empty(); - } - }) + .flatMap(RddPathUtils::findRDDPaths) .distinct() .collect(Collectors.toList()); } @@ -316,11 +272,11 @@ public static boolean safeIsDefinedAt(PartialFunction pfn, Object x) { return false; } catch (Exception e) { if (e != null) { - log.debug("isDefinedAt 
method failed on {}", e); + log.info("isDefinedAt method failed on {}", e); } return false; } catch (NoClassDefFoundError e) { - log.debug("isDefinedAt method failed on {}", e.getMessage()); + log.info("isDefinedAt method failed on {}", e.getMessage()); return false; } } @@ -331,6 +287,8 @@ public static boolean safeIsDefinedAt(PartialFunction pfn, Object x) { * @param pfn * @param x * @return + * @param + * @param */ public static List safeApply(PartialFunction> pfn, D x) { try { diff --git a/metadata-integration/java/spark-lineage-beta/src/main/java/io/openlineage/spark/agent/util/RemovePathPatternUtils.java b/metadata-integration/java/spark-lineage-beta/src/main/java/io/openlineage/spark/agent/util/RemovePathPatternUtils.java new file mode 100644 index 00000000000000..a606a44ddd5160 --- /dev/null +++ b/metadata-integration/java/spark-lineage-beta/src/main/java/io/openlineage/spark/agent/util/RemovePathPatternUtils.java @@ -0,0 +1,182 @@ +/* +/* Copyright 2018-2024 contributors to the OpenLineage project +/* SPDX-License-Identifier: Apache-2.0 +*/ + +package io.openlineage.spark.agent.util; + +import com.typesafe.config.Config; +import com.typesafe.config.ConfigFactory; +import datahub.spark.conf.SparkAppContext; +import datahub.spark.conf.SparkConfigParser; +import io.datahubproject.openlineage.config.DatahubOpenlineageConfig; +import io.datahubproject.openlineage.dataset.HdfsPathDataset; +import io.openlineage.client.OpenLineage.InputDataset; +import io.openlineage.client.OpenLineage.OutputDataset; +import io.openlineage.spark.api.OpenLineageContext; +import java.net.URI; +import java.net.URISyntaxException; +import java.util.Arrays; +import java.util.List; +import java.util.Optional; +import java.util.regex.Pattern; +import java.util.stream.Collectors; +import lombok.extern.slf4j.Slf4j; +import org.apache.commons.lang.StringUtils; +import org.apache.spark.SparkConf; +import org.apache.spark.sql.SparkSession; + +/** + * Utility class to handle removing path patterns in dataset names. 
Given a configured regex pattern + * with "remove" group defined, class methods run regex replacements on all the datasets available + * within the event + */ +@Slf4j +public class RemovePathPatternUtils { + public static final String REMOVE_PATTERN_GROUP = "remove"; + public static final String SPARK_OPENLINEAGE_DATASET_REMOVE_PATH_PATTERN = + "spark.openlineage.dataset.removePath.pattern"; + + private static Optional sparkConf = Optional.empty(); + + public static List removeOutputsPathPattern_ol( + OpenLineageContext context, List outputs) { + return getPattern(context) + .map( + pattern -> + outputs.stream() + .map( + dataset -> { + String newName = removePath(pattern, dataset.getName()); + if (newName != dataset.getName()) { + return context + .getOpenLineage() + .newOutputDatasetBuilder() + .name(removePath(pattern, dataset.getName())) + .namespace(dataset.getNamespace()) + .facets(dataset.getFacets()) + .outputFacets(dataset.getOutputFacets()) + .build(); + } else { + return dataset; + } + }) + .collect(Collectors.toList())) + .orElse(outputs); + } + + // This method was replaced to support Datahub PathSpecs + public static List removeOutputsPathPattern( + OpenLineageContext context, List outputs) { + return outputs.stream() + .map( + dataset -> { + String newName = removePathPattern(dataset.getName()); + if (newName != dataset.getName()) { + return context + .getOpenLineage() + .newOutputDatasetBuilder() + .name(newName) + .namespace(dataset.getNamespace()) + .facets(dataset.getFacets()) + .outputFacets(dataset.getOutputFacets()) + .build(); + } else { + return dataset; + } + }) + .collect(Collectors.toList()); + } + + // This method was replaced to support Datahub PathSpecs + public static List removeInputsPathPattern( + OpenLineageContext context, List inputs) { + return inputs.stream() + .map( + dataset -> { + String newName = removePathPattern(dataset.getName()); + if (newName != dataset.getName()) { + return context + .getOpenLineage() + .newInputDatasetBuilder() + .name(newName) + .namespace(dataset.getNamespace()) + .facets(dataset.getFacets()) + .inputFacets(dataset.getInputFacets()) + .build(); + } else { + return dataset; + } + }) + .collect(Collectors.toList()); + } + + private static Optional getPattern(OpenLineageContext context) { + return Optional.ofNullable(context.getSparkContext()) + .map(sparkContext -> sparkContext.conf()) + .filter(conf -> conf.contains(SPARK_OPENLINEAGE_DATASET_REMOVE_PATH_PATTERN)) + .map(conf -> conf.get(SPARK_OPENLINEAGE_DATASET_REMOVE_PATH_PATTERN)) + .map(pattern -> Pattern.compile(pattern)); + } + + private static String removePath(Pattern pattern, String name) { + return Optional.ofNullable(pattern.matcher(name)) + .filter(matcher -> matcher.find()) + .filter( + matcher -> { + try { + matcher.group(REMOVE_PATTERN_GROUP); + return true; + } catch (IllegalStateException | IllegalArgumentException e) { + return false; + } + }) + .filter(matcher -> StringUtils.isNotEmpty(matcher.group(REMOVE_PATTERN_GROUP))) + .map( + matcher -> + name.substring(0, matcher.start(REMOVE_PATTERN_GROUP)) + + name.substring(matcher.end(REMOVE_PATTERN_GROUP), name.length())) + .orElse(name); + } + + /** + * SparkConf does not change through job lifetime but it can get lost once session is closed. 
It's + * good to have it set in case of SPARK-29046 + */ + private static Optional loadSparkConf() { + if (!sparkConf.isPresent() && SparkSession.getDefaultSession().isDefined()) { + sparkConf = Optional.of(SparkSession.getDefaultSession().get().sparkContext().getConf()); + } + return sparkConf; + } + + private static String removePathPattern(String datasetName) { + // TODO: The reliance on global-mutable state here should be changed + // this led to problems in the PathUtilsTest class, where some tests interfered with others + log.info("Removing path pattern from dataset name {}", datasetName); + Optional conf = loadSparkConf(); + if (!conf.isPresent()) { + return datasetName; + } + try { + String propertiesString = + Arrays.stream(conf.get().getAllWithPrefix("spark.datahub.")) + .map(tup -> tup._1 + "= \"" + tup._2 + "\"") + .collect(Collectors.joining("\n")); + Config datahubConfig = ConfigFactory.parseString(propertiesString); + DatahubOpenlineageConfig datahubOpenlineageConfig = + SparkConfigParser.sparkConfigToDatahubOpenlineageConf( + datahubConfig, new SparkAppContext()); + HdfsPathDataset hdfsPath = + HdfsPathDataset.create(new URI(datasetName), datahubOpenlineageConfig); + log.debug("Transformed path is {}", hdfsPath.getDatasetPath()); + return hdfsPath.getDatasetPath(); + } catch (InstantiationException e) { + log.warn( + "Unable to convert dataset {} to path the exception was {}", datasetName, e.getMessage()); + return datasetName; + } catch (URISyntaxException e) { + throw new RuntimeException(e); + } + } +} diff --git a/metadata-integration/java/spark-lineage-beta/src/test/resources/ol_events/sample_spark.json b/metadata-integration/java/spark-lineage-beta/src/test/resources/ol_events/sample_spark.json index 77a6ebc4044bdf..acb7f585e98c90 100644 --- a/metadata-integration/java/spark-lineage-beta/src/test/resources/ol_events/sample_spark.json +++ b/metadata-integration/java/spark-lineage-beta/src/test/resources/ol_events/sample_spark.json @@ -40,7 +40,7 @@ "inputs": [ { "namespace": "file", - "name": "/Users/treff7es/shadow/spark-test/people.json", + "name": "/my_folder/spark-test/people.json", "facets": { "dataSource": { "_producer": "https://github.com/OpenLineage/OpenLineage/tree/1.2.2/integration/spark", @@ -69,7 +69,7 @@ "outputs": [ { "namespace": "file", - "name": "/Users/treff7es/shadow/spark-test/result", + "name": "/my_folder/shadow/spark-test/result", "facets": { "dataSource": { "_producer": "https://github.com/OpenLineage/OpenLineage/tree/1.2.2/integration/spark", @@ -95,7 +95,7 @@ "inputFields": [ { "namespace": "file", - "name": "/Users/treff7es/shadow/spark-test/people.json", + "name": "/my_folder/spark-test/people.json", "field": "name" } ] diff --git a/metadata-integration/java/spark-lineage/build.gradle b/metadata-integration/java/spark-lineage/build.gradle index 1b3c87288abf82..8db8a09f8cc813 100644 --- a/metadata-integration/java/spark-lineage/build.gradle +++ b/metadata-integration/java/spark-lineage/build.gradle @@ -48,7 +48,7 @@ dependencies { provided(externalDependency.sparkSql) provided(externalDependency.sparkHive) - implementation externalDependency.httpAsyncClient + implementation externalDependency.httpClient // Tests need a concrete log4j available. 
Providing it here testImplementation 'org.apache.logging.log4j:log4j-api:2.17.1' @@ -106,7 +106,7 @@ shadowJar { relocate 'com.fasterxml.jackson', 'datahub.shaded.jackson' relocate 'org.slf4j','datahub.shaded.org.slf4j' - relocate 'org.apache.http','datahub.spark2.shaded.http' + relocate 'org.apache.hc','datahub.spark2.shaded.http' relocate 'org.apache.commons.codec', 'datahub.spark2.shaded.o.a.c.codec' relocate 'org.apache.commons.compress', 'datahub.spark2.shaded.o.a.c.compress' relocate 'org.apache.commons.io', 'datahub.spark2.shaded.o.a.c.io'
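
The hunks above introduce two retry settings in `SparkConfigParser` (`rest.max_retries` and `rest.retry_interval_in_sec`, wired into `RestEmitterConfig`) and flip the `isPatchEnabled` default to `false`. A minimal sketch of how a job might opt into them is shown below; the `spark.datahub.*` prefix mirrors the parser's `getAllWithPrefix("spark.datahub.")` handling, while the listener class name, server URL and token are placeholder assumptions rather than values taken from this patch.

```java
import org.apache.spark.sql.SparkSession;

public class DatahubRetryConfigSketch {
  public static void main(String[] args) {
    SparkSession spark =
        SparkSession.builder()
            .appName("datahub-retry-config-sketch")
            .master("local[*]") // local master only so the sketch runs standalone
            .config("spark.extraListeners", "datahub.spark.DatahubSparkListener") // assumed listener class
            .config("spark.datahub.rest.server", "http://localhost:8080") // placeholder GMS endpoint
            .config("spark.datahub.rest.token", "<your-token>") // placeholder token
            // New keys from this change; when unset they fall back to 0 retries / 5 second interval.
            .config("spark.datahub.rest.max_retries", "3")
            .config("spark.datahub.rest.retry_interval_in_sec", "10")
            // Patch-style emission is now opt-in since the default changed to false.
            .config("spark.datahub.patch.enabled", "true")
            .getOrCreate();

    spark.range(10).count(); // run a trivial job so the listener has something to emit
    spark.stop();
  }
}
```

The same keys can equally be passed with `--conf` on `spark-submit`; only the two `rest.*` retry keys and the `patch.enabled` default are new in this diff.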
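The new `RemovePathPatternUtils` trims whatever the named `remove` group of `spark.openlineage.dataset.removePath.pattern` matches out of each input and output dataset name, leaving the name untouched when the pattern is absent or does not match. The snippet below re-implements just that substring logic so the behaviour is easy to verify in isolation; the pattern value and the dataset name are invented examples, not defaults shipped with the plugin.

```java
import java.util.regex.Matcher;
import java.util.regex.Pattern;

public class RemovePathPatternSketch {
  public static void main(String[] args) {
    // Illustrative value for spark.openlineage.dataset.removePath.pattern:
    // the "remove" group marks the path segment to strip from dataset names.
    Pattern pattern = Pattern.compile("(?<remove>/snapshot_\\d{8})");
    String name = "/warehouse/events/snapshot_20240101/part-0000";

    Matcher matcher = pattern.matcher(name);
    if (matcher.find() && !matcher.group("remove").isEmpty()) {
      // Same idea as RemovePathPatternUtils.removePath: keep everything outside the group.
      String cleaned =
          name.substring(0, matcher.start("remove")) + name.substring(matcher.end("remove"));
      System.out.println(cleaned); // -> /warehouse/events/part-0000
    } else {
      System.out.println(name); // no match: the name passes through unchanged
    }
  }
}
```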