From 461ba01f08e16ba592b65c3bf475a78871b96be4 Mon Sep 17 00:00:00 2001 From: Helen Yang Date: Thu, 29 Sep 2022 09:45:54 -0700 Subject: [PATCH 01/68] Add Data Models in Feathr (#659) * Add Data Models in Feathr This RB is to create data models based on proposal: https://microsoft-my.sharepoint.com/:w:/g/personal/djkim_linkedin_biz/EZspGt7jJlRAqHTICZg3UbcBgQQ_VncOgM48hKW--T8qkg?e=T4N3zw * Update models.py * Update models.py * Update models.py * Update models.py * Update models.py --- registry/data-models/__init__.py | 0 registry/data-models/data-model-diagram.md | 61 +++++++++ registry/data-models/models.py | 146 +++++++++++++++++++++ 3 files changed, 207 insertions(+) create mode 100644 registry/data-models/__init__.py create mode 100644 registry/data-models/data-model-diagram.md create mode 100644 registry/data-models/models.py diff --git a/registry/data-models/__init__.py b/registry/data-models/__init__.py new file mode 100644 index 000000000..e69de29bb diff --git a/registry/data-models/data-model-diagram.md b/registry/data-models/data-model-diagram.md new file mode 100644 index 000000000..e43ffa0af --- /dev/null +++ b/registry/data-models/data-model-diagram.md @@ -0,0 +1,61 @@ + +# Feathr Abstract backend Data Model Diagram + +This file defines abstract backend data models diagram for feature registry. +[Python Code](./models.py) + +```mermaid +classDiagram + Project "1" --> "n" FeatureName : contains + Project "1" --> "n" Anchor : contains + FeatureName "1" --> "n" Feature : contains + Anchor "1" --> "n" Feature : contains + Feature <|-- AnchorFeature : extends + Feature <|-- DerivedFeature: extends + Feature --> Transformation + Feature --> Transformation : contains + Source <|-- DataSource: extends + Source <|-- MultiFeatureSource: extends + MultiFeatureSource "1" --> "1..n" FeatureSource: contains + AnchorFeature --> DataSource : contains + DerivedFeature --> MultiFeatureSource: contains + + class Source{ + } + class DataSource{ + } + class FeatureSource{ + +FeatureNameId feature_name_id + } + class MultiFeatureSource{ + +List[FeatureSource] sources + } + class Feature{ + +FeatureId id + +FeatureNameId feature_namme_id + +Source source + +Transformation transformation + } + class AnchorFeature{ + +DataSource source + } + class DerivedFeature{ + +MultiFeatureSource source + } + class FeatureName{ + +FeatureNameId id + +ProjectId project_id + +List[FeatureId] feature_ids + } + class Project{ + +ProjectId id + +List[FeatureNameId] feature_name_ids + +List[AnchorId] anchor_ids + } + class Anchor{ + +AnchorId id + +ProjectId project_id + +DataSource source + +List[FeatureId] anchor_feature_ids + } +``` \ No newline at end of file diff --git a/registry/data-models/models.py b/registry/data-models/models.py new file mode 100644 index 000000000..c4ae31f68 --- /dev/null +++ b/registry/data-models/models.py @@ -0,0 +1,146 @@ +from pydantic import BaseModel +from typing import List + +""" +This file defines abstract backend data models for feature registry. +Backend data models will be used by backend API server to talk to feature registry backend. +Purpose of this is to decouple backend data models from API specific data models. +For each feature registry provider/implementation, they will extend this abstract +data models and backend API. +Diagram of the data models: ./data-model-diagram.md +""" + + +class FeatureId(BaseModel): + """ + Id for Feature, it's unique ID represents Feature. + Id can be a simple string, int or complex key. 
+ """ + id: str # id of a feature + + +class FeatureNameId(BaseModel): + """ + Id for FeatureName, it's unique ID represents FeatureName. + Id can be a simple string, int or complex key. + """ + id: str # id of a FeatureName + + +class AnchorId(BaseModel): + """ + Id for Anchor, it's unique ID represents Anchor. + Id can be a simple string, int or complex key. + """ + id: str # id of a anchor + + +class ProjectId(BaseModel): + """ + Id for Project, it's unique ID represents Project. + Id can be a simple string, int or complex key. + """ + id: str # id of a project + + +class Source(BaseModel): + """ + Source of the feature. + It defines where the feature is extracted or derived from. + """ + pass + + +class DataSource(Source): + """ + Data source of the feature. + It defines the raw data source the feature is extracted from. + """ + pass + + +class FeatureSource(BaseModel): + """ + Represents a feature source for a derived feature. That is, it is a source 'FeatureName' which is used for + creating other derived features. + """ + input_feature_name_id: FeatureNameId # Input feature name Key + + +class MultiFeatureSource(Source): + """ + Feature sources of the feature. + It defines one to many features where the feature is derived from. + """ + sources: List[FeatureSource] # All source features which the feature is derived from + pass + + +class Transformation(BaseModel): + """ + The transformation of a Feature. + A transformation function represents the transformation logic to produce feature value from the source of FeatureAnchor + """ + pass + + +class Feature(BaseModel): + """ + Actual implementation of FeatureName. + An implementation defines where a feature is extracted from (Source) and how it is computed (Transformation). + The Source of a feature can be raw data sources and/or other features. + """ + id: FeatureId # Unique ID for Feature + feature_name_id: FeatureNameId # Id of the feature name that the feature belongs to + source: Source # Source can be either data source or feature source + transformation: Transformation # transformation logic to produce feature value + + +class AnchorFeature(Feature): + """ + Feature implementation of FeatureName which anchored to a data source. + """ + source: DataSource # Raw data source where the feature is extracted from + + +class DerivedFeature(Feature): + """ + Feature implementation that is derived from other FeatureNames. + """ + source: MultiFeatureSource # Source features where the feature is derived from + + +class FeatureName(BaseModel): + """ + Named Feature Interface that can be backed by multiple Feature implementations across + different environments accessing different sources (data lake access for batch training, + KV store access for online serving). Each FeatureName is defined by feature producer. + Feature consumers reference a feature by that name to access that feature data, + agnostic of runtime environment. Each FeatureName also encloses attributes that does not + change across implementations. + """ + id: FeatureNameId # unique ID for FeatureName, used to extract data for current FeatureName + project_id: ProjectId # ID of the project the FeatureName belongs to + feature_ids: List[FeatureId] # List of ids of feature that the FeatureName has + + +class Project(BaseModel): + """ + Group of FeatureNames. It can be a project the team is working on, + or a namespace which related FeatureNames have. + """ + id: ProjectId # Unique ID of the project. 
+ feature_name_ids: List[FeatureNameId] # List of feature name ids that the project has + anchor_ids: List[AnchorId] # List of Anchor ids that the project has + + +class Anchor(BaseModel): + """ + Group of AnchorFeatures which anchored on same DataSource. + This is mainly used by feature producer gather information about DataSource + and FeatureImplementations associated with the DataSource. + """ + id: AnchorId # Unique ID for Anchor + project_id: ProjectId # ID of Project that the anchor belongs to + source: DataSource # data source of the Anchor + anchor_feature_ids: List[FeatureId] # List of anchor features that the anchor has From d187ae277113ec50b6f5461f3eff1f9eed48a198 Mon Sep 17 00:00:00 2001 From: Blair Chen Date: Fri, 30 Sep 2022 12:50:02 +0800 Subject: [PATCH 02/68] Revert "Enhance purview registry error messages (#709)" (#720) This reverts commit 059f2b4b6311632b15adf64b1a38f493981b155e. --- ...d-and-push-feathr-registry-docker-image.md | 6 +-- registry/purview-registry/main.py | 47 +------------------ .../registry/purview_registry.py | 34 ++++++-------- 3 files changed, 17 insertions(+), 70 deletions(-) diff --git a/docs/dev_guide/build-and-push-feathr-registry-docker-image.md b/docs/dev_guide/build-and-push-feathr-registry-docker-image.md index 04b1fe487..873c6a141 100644 --- a/docs/dev_guide/build-and-push-feathr-registry-docker-image.md +++ b/docs/dev_guide/build-and-push-feathr-registry-docker-image.md @@ -76,8 +76,4 @@ docker push feathrfeaturestore/feathr-registry ## Published Feathr Registry Image -The published feathr feature registry is located in [DockerHub here](https://hub.docker.com/r/feathrfeaturestore/feathr-registry). - -## Include the detailed track back info in registry api HTTP error response - -Set environment REGISTRY_DEBUGGING to any non empty string will enable the detailed track back info in registry api http response. This variable is helpful for python client debugging and should only be used for debugging purposes. +The published feathr feature registry is located in [DockerHub here](https://hub.docker.com/r/feathrfeaturestore/feathr-registry). 
\ No newline at end of file diff --git a/registry/purview-registry/main.py b/registry/purview-registry/main.py index 92aa8dc49..5d38adf74 100644 --- a/registry/purview-registry/main.py +++ b/registry/purview-registry/main.py @@ -1,12 +1,11 @@ import os -import traceback from re import sub from typing import Optional from uuid import UUID from fastapi import APIRouter, FastAPI, HTTPException -from fastapi.responses import JSONResponse from starlette.middleware.cors import CORSMiddleware -from registry.purview_registry import PurviewRegistry, ConflictError +from registry import * +from registry.purview_registry import PurviewRegistry from registry.models import AnchorDef, AnchorFeatureDef, DerivedFeatureDef, EntityType, ProjectDef, SourceDef, to_snake rp = "/v1" @@ -44,48 +43,6 @@ def to_camel(s): allow_headers=["*"], ) -def exc_to_content(e: Exception) -> dict: - content={"message": str(e)} - if os.environ.get("REGISTRY_DEBUGGING"): - content["traceback"] = "".join(traceback.TracebackException.from_exception(e).format()) - return content - -@app.exception_handler(ConflictError) -async def conflict_error_handler(_, exc: ConflictError): - return JSONResponse( - status_code=409, - content=exc_to_content(exc), - ) - - -@app.exception_handler(ValueError) -async def value_error_handler(_, exc: ValueError): - return JSONResponse( - status_code=400, - content=exc_to_content(exc), - ) - -@app.exception_handler(TypeError) -async def type_error_handler(_, exc: ValueError): - return JSONResponse( - status_code=400, - content=exc_to_content(exc), - ) - - -@app.exception_handler(KeyError) -async def key_error_handler(_, exc: KeyError): - return JSONResponse( - status_code=404, - content=exc_to_content(exc), - ) - -@app.exception_handler(IndexError) -async def index_error_handler(_, exc: IndexError): - return JSONResponse( - status_code=404, - content=exc_to_content(exc), - ) @router.get("/projects",tags=["Project"]) def get_projects() -> list[str]: diff --git a/registry/purview-registry/registry/purview_registry.py b/registry/purview-registry/registry/purview_registry.py index 06d7bd8d1..9f5f47560 100644 --- a/registry/purview-registry/registry/purview_registry.py +++ b/registry/purview-registry/registry/purview_registry.py @@ -1,6 +1,8 @@ import copy +from http.client import CONFLICT, HTTPException import itertools -from typing import Optional, Tuple, Union +from typing import Any, Optional, Tuple, Union +from urllib.error import HTTPError from uuid import UUID from azure.identity import DefaultAzureCredential @@ -9,7 +11,7 @@ from pyapacheatlas.core import (AtlasEntity, AtlasProcess, PurviewClient) from pyapacheatlas.core.typedef import (AtlasAttributeDef,Cardinality,EntityTypeDef) -from pyapacheatlas.core.util import GuidTracker, AtlasException +from pyapacheatlas.core.util import GuidTracker from pyhocon import ConfigFactory from registry.interface import Registry @@ -21,10 +23,6 @@ TYPEDEF_ARRAY_ANCHOR=f"array" TYPEDEF_ARRAY_DERIVED_FEATURE=f"array" TYPEDEF_ARRAY_ANCHOR_FEATURE=f"array" - -class ConflictError(Exception): - pass - class PurviewRegistry(Registry): def __init__(self,azure_purview_name: str, registry_delimiter: str = "__", credential=None,register_types = True): self.registry_delimiter = registry_delimiter @@ -570,22 +568,18 @@ def _register_feathr_feature_types(self): def _upload_entity_batch(self, entity_batch:list[AtlasEntity]): # we only support entity creation, update is not supported. 
# setting lastModifiedTS ==0 will ensure this, if another entity with ts>=1 exist - # upload function will fail with 412 Precondition fail. + # upload funtion will fail with 412 Precondition fail. for entity in entity_batch: entity.lastModifiedTS="0" - try: - results = self.purview_client.upload_entities( - batch=entity) - if results: - dict = {x.guid: x for x in entity_batch} - for k, v in results['guidAssignments'].items(): - dict[k].guid = v - else: - raise RuntimeError("Feature registration failed.", results) - except AtlasException as e: - if "PreConditionCheckFailed" in e.args[0]: - raise ConflictError(f"Entity {entity.guid}, {entity.typeName} -- {entity.qualifiedName} already exists in Purview. Please use a new name.") - + results = self.purview_client.upload_entities( + batch=entity) + if results: + dict = {x.guid: x for x in entity_batch} + for k, v in results['guidAssignments'].items(): + dict[k].guid = v + else: + raise RuntimeError("Feature registration failed.", results) + def _generate_fully_qualified_name(self, segments): return self.registry_delimiter.join(segments) From 6d1e7a698334ced9612b2f9ae645968fefbc1808 Mon Sep 17 00:00:00 2001 From: Jinghui Mo Date: Wed, 5 Oct 2022 16:15:17 -0400 Subject: [PATCH 03/68] Improve Avro GenericRecord and SpecificRecord based row-level extractor performance (#723) * 1. In SparkRowExtractor.scala, add new extractor method which can be extended to do batch preprocess source dataframe into RDD[IndexRecord]. 2. In FeatureTransformation.scala, add logic to extract features from RDD[IndexedRecord]. 3. Improve some error messages. --- .../feathr/common/AnchorExtractor.scala | 8 +- .../feathr/common/CanConvertToAvroRDD.scala | 20 ++ .../feathr/common/SparkRowExtractor.scala | 6 +- .../SimpleConfigurableAnchorExtractor.scala | 7 +- .../keyExtractor/MVELSourceKeyExtractor.scala | 7 +- .../offline/config/FeathrConfigLoader.scala | 2 +- .../StreamingFeatureGenerator.scala | 4 +- .../offline/job/FeatureTransformation.scala | 259 +++++++++++++++++- .../DataFrameBasedRowEvaluator.scala | 27 +- .../DefaultValueSubstituter.scala | 2 +- .../transformation/FDSConversionUtils.scala | 2 +- .../util/FeatureValueTypeValidator.scala | 24 +- .../offline/util/FeaturizedDatasetUtils.scala | 2 +- .../util/TestFeatureValueTypeValidator.scala | 4 +- 14 files changed, 318 insertions(+), 56 deletions(-) create mode 100644 src/main/scala/com/linkedin/feathr/common/CanConvertToAvroRDD.scala diff --git a/src/main/scala/com/linkedin/feathr/common/AnchorExtractor.scala b/src/main/scala/com/linkedin/feathr/common/AnchorExtractor.scala index 2e38e4d04..185c9d2d6 100644 --- a/src/main/scala/com/linkedin/feathr/common/AnchorExtractor.scala +++ b/src/main/scala/com/linkedin/feathr/common/AnchorExtractor.scala @@ -1,7 +1,5 @@ package com.linkedin.feathr.common -import org.apache.spark.sql.catalyst.expressions.GenericRowWithSchema - /** * Provides feature values based on some "raw" data element * @@ -39,12 +37,14 @@ trait AnchorExtractor[T] extends AnchorExtractorBase[T] with SparkRowExtractor { * @param datum input row * @return list of feature keys */ - def getKeyFromRow(datum: GenericRowWithSchema): Seq[String] = getKey(datum.asInstanceOf[T]) + def getKeyFromRow(datum: Any): Seq[String] = getKey(datum.asInstanceOf[T]) /** * Get the feature value from the row * @param datum input row * @return A map of feature name to feature value */ - def getFeaturesFromRow(datum: GenericRowWithSchema): Map[String, FeatureValue] = getFeatures(datum.asInstanceOf[T]) + def 
getFeaturesFromRow(datum: Any): Map[String, FeatureValue] = getFeatures(datum.asInstanceOf[T]) + + override def toString: String = getClass.getSimpleName } diff --git a/src/main/scala/com/linkedin/feathr/common/CanConvertToAvroRDD.scala b/src/main/scala/com/linkedin/feathr/common/CanConvertToAvroRDD.scala new file mode 100644 index 000000000..7051a308c --- /dev/null +++ b/src/main/scala/com/linkedin/feathr/common/CanConvertToAvroRDD.scala @@ -0,0 +1,20 @@ +package com.linkedin.feathr.common + +import org.apache.avro.generic.IndexedRecord +import org.apache.spark.rdd.RDD +import org.apache.spark.sql.DataFrame + +/** + * If an AnchorExtractor only works on a Avro record, it should extends + * this trait, and use convertToAvroRdd to do a one-time batch conversion of DataFrame to RDD of their choice. + * convertToAvroRdd will be called by Feathr engine before calling getKeyFromRow() and getFeaturesFromRow() in AnchorExtractor. + */ +trait CanConvertToAvroRDD { + + /** + * One time batch converting the input data source into a RDD[IndexedRecord] for feature extraction later + * @param df input data source + * @return batch preprocessed dataframe, as RDD[IndexedRecord] + */ + def convertToAvroRdd(df: DataFrame) : RDD[IndexedRecord] +} diff --git a/src/main/scala/com/linkedin/feathr/common/SparkRowExtractor.scala b/src/main/scala/com/linkedin/feathr/common/SparkRowExtractor.scala index 04e715e8c..ad088ac0a 100644 --- a/src/main/scala/com/linkedin/feathr/common/SparkRowExtractor.scala +++ b/src/main/scala/com/linkedin/feathr/common/SparkRowExtractor.scala @@ -1,7 +1,5 @@ package com.linkedin.feathr.common -import org.apache.spark.sql.catalyst.expressions.GenericRowWithSchema - /** * An extractor trait that provides APIs to transform a Spark GenericRowWithSchema into feature values */ @@ -12,12 +10,12 @@ trait SparkRowExtractor { * @param datum input row * @return list of feature keys */ - def getKeyFromRow(datum: GenericRowWithSchema): Seq[String] + def getKeyFromRow(datum: Any): Seq[String] /** * Get the feature value from the row * @param datum input row * @return A map of feature name to feature value */ - def getFeaturesFromRow(datum: GenericRowWithSchema): Map[String, FeatureValue] + def getFeaturesFromRow(datum: Any): Map[String, FeatureValue] } \ No newline at end of file diff --git a/src/main/scala/com/linkedin/feathr/offline/anchored/anchorExtractor/SimpleConfigurableAnchorExtractor.scala b/src/main/scala/com/linkedin/feathr/offline/anchored/anchorExtractor/SimpleConfigurableAnchorExtractor.scala index 59f5bfbe7..edb2e2c06 100644 --- a/src/main/scala/com/linkedin/feathr/offline/anchored/anchorExtractor/SimpleConfigurableAnchorExtractor.scala +++ b/src/main/scala/com/linkedin/feathr/offline/anchored/anchorExtractor/SimpleConfigurableAnchorExtractor.scala @@ -10,7 +10,6 @@ import com.linkedin.feathr.offline.mvel.plugins.FeathrExpressionExecutionContext import com.linkedin.feathr.offline.mvel.{MvelContext, MvelUtils} import com.linkedin.feathr.offline.util.FeatureValueTypeValidator import org.apache.log4j.Logger -import org.apache.spark.sql.catalyst.expressions.GenericRowWithSchema import org.apache.spark.sql.types._ import org.mvel2.MVEL @@ -66,7 +65,7 @@ private[offline] class SimpleConfigurableAnchorExtractor( @JsonProperty("key") k * @param datum input row * @return list of feature keys */ - override def getKeyFromRow(datum: GenericRowWithSchema): Seq[String] = { + override def getKeyFromRow(datum: Any): Seq[String] = { getKey(datum.asInstanceOf[Any]) } @@ -107,7 +106,7 @@ 
private[offline] class SimpleConfigurableAnchorExtractor( @JsonProperty("key") k * @param row input row * @return A map of feature name to feature value */ - override def getFeaturesFromRow(row: GenericRowWithSchema) = { + override def getFeaturesFromRow(row: Any) = { getFeatures(row.asInstanceOf[Any]) } @@ -147,7 +146,7 @@ private[offline] class SimpleConfigurableAnchorExtractor( @JsonProperty("key") k featureTypeConfigs(featureRefStr) } val featureValue = offline.FeatureValue.fromTypeConfig(value, featureTypeConfig) - FeatureValueTypeValidator.validate(featureValue, featureTypeConfigs(featureRefStr)) + FeatureValueTypeValidator.validate(featureRefStr, featureValue, featureTypeConfigs(featureRefStr) ) (featureRefStr, featureValue) } diff --git a/src/main/scala/com/linkedin/feathr/offline/anchored/keyExtractor/MVELSourceKeyExtractor.scala b/src/main/scala/com/linkedin/feathr/offline/anchored/keyExtractor/MVELSourceKeyExtractor.scala index 209ac89e1..bf5108e8b 100644 --- a/src/main/scala/com/linkedin/feathr/offline/anchored/keyExtractor/MVELSourceKeyExtractor.scala +++ b/src/main/scala/com/linkedin/feathr/offline/anchored/keyExtractor/MVELSourceKeyExtractor.scala @@ -43,7 +43,7 @@ private[feathr] class MVELSourceKeyExtractor(val anchorExtractorV1: AnchorExtrac .toDF() } - def getKey(datum: GenericRowWithSchema): Seq[String] = { + def getKey(datum: Any): Seq[String] = { anchorExtractorV1.getKeyFromRow(datum) } @@ -55,7 +55,7 @@ private[feathr] class MVELSourceKeyExtractor(val anchorExtractorV1: AnchorExtrac */ override def getKeyColumnNames(datum: Option[Any]): Seq[String] = { if (datum.isDefined) { - val size = getKey(datum.get.asInstanceOf[GenericRowWithSchema]).size + val size = getKey(datum.get).size (1 to size).map(JOIN_KEY_PREFIX + _) } else { // return empty join key to signal empty dataset @@ -86,5 +86,6 @@ private[feathr] class MVELSourceKeyExtractor(val anchorExtractorV1: AnchorExtrac // this helps to reduce the number of joins // to the observation data // The default toString does not work, because toString of each object have different values - override def toString: String = getClass.getSimpleName + " with keyExprs:" + keyExprs.mkString(" key:") + override def toString: String = getClass.getSimpleName + " with keyExprs:" + keyExprs.mkString(" key:") + + "anchorExtractor:" + anchorExtractorV1.toString } diff --git a/src/main/scala/com/linkedin/feathr/offline/config/FeathrConfigLoader.scala b/src/main/scala/com/linkedin/feathr/offline/config/FeathrConfigLoader.scala index 1faf0d814..e2ec6e588 100644 --- a/src/main/scala/com/linkedin/feathr/offline/config/FeathrConfigLoader.scala +++ b/src/main/scala/com/linkedin/feathr/offline/config/FeathrConfigLoader.scala @@ -327,7 +327,7 @@ private[offline] class AnchorLoader extends JsonDeserializer[FeatureAnchor] { case Some(tType) => offline.FeatureValue.fromTypeConfig(rawValue, tType) case None => offline.FeatureValue(rawValue, featureType, key) } - FeatureValueTypeValidator.validate(featureValue, featureTypeConfig) + FeatureValueTypeValidator.validate(featureValue, featureTypeConfig, key) (key, featureValue) } .toMap diff --git a/src/main/scala/com/linkedin/feathr/offline/generation/StreamingFeatureGenerator.scala b/src/main/scala/com/linkedin/feathr/offline/generation/StreamingFeatureGenerator.scala index 99436b93c..126128323 100644 --- a/src/main/scala/com/linkedin/feathr/offline/generation/StreamingFeatureGenerator.scala +++ b/src/main/scala/com/linkedin/feathr/offline/generation/StreamingFeatureGenerator.scala @@ -6,7 +6,7 @@ import 
com.linkedin.feathr.common.JoiningFeatureParams import com.linkedin.feathr.offline.config.location.KafkaEndpoint import com.linkedin.feathr.offline.generation.outputProcessor.PushToRedisOutputProcessor.TABLE_PARAM_CONFIG_NAME import com.linkedin.feathr.offline.generation.outputProcessor.RedisOutputUtils -import com.linkedin.feathr.offline.job.FeatureTransformation.getFeatureJoinKey +import com.linkedin.feathr.offline.job.FeatureTransformation.getFeatureKeyColumnNames import com.linkedin.feathr.offline.job.{FeatureGenSpec, FeatureTransformation} import com.linkedin.feathr.offline.logical.FeatureGroups import com.linkedin.feathr.offline.source.accessor.DataPathHandler @@ -111,7 +111,7 @@ class StreamingFeatureGenerator(dataPathHandlers: List[DataPathHandler]) { // Apply feature transformation val transformedResult = DataFrameBasedSqlEvaluator.transform(anchor.featureAnchor.extractor.asInstanceOf[SimpleAnchorExtractorSpark], withKeyColumnDF, featureNamePrefixPairs, anchor.featureAnchor.featureTypeConfigs) - val outputJoinKeyColumnNames = getFeatureJoinKey(keyExtractor, withKeyColumnDF) + val outputJoinKeyColumnNames = getFeatureKeyColumnNames(keyExtractor, withKeyColumnDF) val selectedColumns = outputJoinKeyColumnNames ++ anchor.selectedFeatures.filter(keyTaggedFeatures.map(_.featureName).contains(_)) val cleanedDF = transformedResult.df.select(selectedColumns.head, selectedColumns.tail:_*) val keyColumnNames = FeatureTransformation.getStandardizedKeyNames(outputJoinKeyColumnNames.size) diff --git a/src/main/scala/com/linkedin/feathr/offline/job/FeatureTransformation.scala b/src/main/scala/com/linkedin/feathr/offline/job/FeatureTransformation.scala index 94de8e645..7b106572b 100644 --- a/src/main/scala/com/linkedin/feathr/offline/job/FeatureTransformation.scala +++ b/src/main/scala/com/linkedin/feathr/offline/job/FeatureTransformation.scala @@ -1,7 +1,9 @@ package com.linkedin.feathr.offline.job -import com.linkedin.feathr.common._ import com.linkedin.feathr.common.exception.{ErrorLabel, FeathrException, FeathrFeatureTransformationException} +import com.linkedin.feathr.common.tensor.TensorData +import com.linkedin.feathr.common.types.FeatureType +import com.linkedin.feathr.common.{AnchorExtractorBase, _} import com.linkedin.feathr.offline.anchored.anchorExtractor.{SQLConfigurableAnchorExtractor, SimpleConfigurableAnchorExtractor, TimeWindowConfigurableAnchorExtractor} import com.linkedin.feathr.offline.anchored.feature.{FeatureAnchor, FeatureAnchorWithSource} import com.linkedin.feathr.offline.anchored.keyExtractor.MVELSourceKeyExtractor @@ -22,6 +24,7 @@ import com.linkedin.feathr.offline.{FeatureDataFrame, JoinKeys} import com.linkedin.feathr.sparkcommon.{SimpleAnchorExtractorSpark, SourceKeyExtractor} import com.linkedin.feathr.swj.aggregate.AggregationType import com.linkedin.feathr.{common, offline} +import org.apache.avro.generic.IndexedRecord import org.apache.log4j.Logger import org.apache.spark.rdd.RDD import org.apache.spark.sql.functions._ @@ -41,6 +44,16 @@ import scala.concurrent.{Await, ExecutionContext, Future} */ private[offline] case class AnchorFeatureGroups(anchorsWithSameSource: Seq[FeatureAnchorWithSource], requestedFeatures: Seq[String]) +/** + * Context info needed in feature transformation + * @param featureAnchorWithSource feature annchor with its source + * @param featureNamePrefixPairs map of feature name to its prefix + * @param transformer transformer of anchor + */ +private[offline] case class TransformInfo(featureAnchorWithSource: FeatureAnchorWithSource, + 
featureNamePrefixPairs: Seq[(FeatureName, FeatureName)], + transformer: AnchorExtractorBase[IndexedRecord]) + /** * Represent the transformed result of an anchor extractor after evaluating its features * @param featureNameAndPrefixPairs pairs of feature name and feature name prefix @@ -75,7 +88,27 @@ private[offline] object FeatureTransformation { // feature name, column prefix type FeatureNameAndColumnPrefix = (String, String) - def getFeatureJoinKey(sourceKeyExtractor: SourceKeyExtractor, withKeyColumnDF: DataFrame, featureExtractor: Option[AnyRef] = None): Seq[String] = { + /** + * Extract feature key column names from the input feature RDD using the sourceKeyExtractor. + * @param sourceKeyExtractor key extractor that knows what are the key column in a feature RDD. + * @param withKeyColumnRDD RDD that contains the key columns. + * @return feature key column names + */ + def getFeatureKeyColumnNamesRdd(sourceKeyExtractor: SourceKeyExtractor, withKeyColumnRDD: RDD[_]): Seq[String] = { + if (withKeyColumnRDD.isEmpty) { + sourceKeyExtractor.getKeyColumnNames(None) + } else { + sourceKeyExtractor.getKeyColumnNames(Some(withKeyColumnRDD.first())) + } + } + + /** + * Extract feature key column names from the input feature DataFrame using the sourceKeyExtractor. + * @param sourceKeyExtractor key extractor that knows what are the key column in a feature RDD. + * @param withKeyColumnDF DataFrame that contains the key columns. + * @return feature key column names + */ + def getFeatureKeyColumnNames(sourceKeyExtractor: SourceKeyExtractor, withKeyColumnDF: DataFrame): Seq[String] = { if (withKeyColumnDF.head(1).isEmpty) { sourceKeyExtractor.getKeyColumnNames(None) } else { @@ -306,7 +339,8 @@ private[offline] object FeatureTransformation { } val withKeyColumnDF = keyExtractor.appendKeyColumns(sourceDF) - val outputJoinKeyColumnNames = getFeatureJoinKey(keyExtractor, withKeyColumnDF, Some(anchorFeatureGroup.anchorsWithSameSource.head.featureAnchor.extractor)) + + val outputJoinKeyColumnNames = getFeatureKeyColumnNames(keyExtractor, withKeyColumnDF) val filteredFactData = applyBloomFilter((keyExtractor, withKeyColumnDF), bloomFilter) // 1. 
apply all transformations on the dataframe in sequential order @@ -457,10 +491,21 @@ private[offline] object FeatureTransformation { val keyExtractor = anchorsWithSameSource.head._1.featureAnchor.sourceKeyExtractor val featureAnchorWithSource = anchorsWithSameSource.keys.toSeq val selectedFeatures = anchorsWithSameSource.flatMap(_._2.featureNames).toSeq - - val sourceDF = featureGroupingFactors.source - val transformedResults: Seq[KeyedTransformedResult] = transformMultiAnchorsOnSingleDataFrame(sourceDF, + val isAvroRddBasedExtractor = featureAnchorWithSource + .map(_.featureAnchor.extractor) + .filter(extractor => extractor.isInstanceOf[CanConvertToAvroRDD] + ).nonEmpty + val transformedResults: Seq[KeyedTransformedResult] = if (isAvroRddBasedExtractor) { + // If there are features are defined using AVRO record based extractor, run RDD based feature transformation + val sourceAccessor = featureGroupingFactors.source + val sourceRdd = sourceAccessor.asInstanceOf[NonTimeBasedDataSourceAccessor].get() + val featureTypeConfigs = featureAnchorWithSource.flatMap(featureAnchor => featureAnchor.featureAnchor.featureTypeConfigs).toMap + Seq(transformFeaturesOnAvroRecord(sourceRdd, keyExtractor, featureAnchorWithSource, bloomFilter, selectedFeatures, featureTypeConfigs)) + } else { + val sourceDF = featureGroupingFactors.source + transformFeaturesOnDataFrameRow(sourceDF, keyExtractor, featureAnchorWithSource, bloomFilter, selectedFeatures, incrementalAggContext, mvelContext) + } val res = transformedResults .map { transformedResultWithKey => @@ -673,6 +718,204 @@ private[offline] object FeatureTransformation { } } + + /** + * Apply a bloomfilter to a RDD + * + * @param keyExtractor key extractor to extract the key values from the RDD + * @param rdd RDD to filter + * @param bloomFilter bloomfilter used to filter out unwanted row in the RDD based on key columns + * @return filtered RDD + */ + + private def applyBloomFilterRdd(keyExtractor: SourceKeyExtractor, rdd: RDD[IndexedRecord], bloomFilter: Option[BloomFilter]): RDD[IndexedRecord] = { + bloomFilter match { + case None => + // no bloom filter, use data as it + rdd + case Some(filter) => + // get the list of join key columns or expression + keyExtractor match { + case extractor: MVELSourceKeyExtractor => + // get the list of join key columns or expression + val keyColumnsList = if (rdd.isEmpty) { + extractor.getKeyColumnNames(None) + } else { + extractor.getKeyColumnNames(Some(rdd.first)) + } + if (!keyColumnsList.isEmpty) { + val filtered = rdd.filter { record: Any => + val keyVals = extractor.getKey(record) + // if key is not in observation, skip it + if (keyVals != null && keyVals.count(_ == null) == 0) { + filter.mightContainString(SourceUtils.generateFilterKeyString(keyVals)) + } else { + false + } + } + filtered + } else { + // expand feature for seq join does not have right key, so we allow empty here + rdd + } + case _ => throw new FeathrFeatureTransformationException(ErrorLabel.FEATHR_USER_ERROR, "No source key extractor found") + } + } + } + + /** + * Transform features defined in a group of anchors based on same source + * This is for the AVRO record based extractors + * + * @param rdd source that requested features are defined on + * @param keyExtractor key extractor to apply on source rdd + * @param featureAnchorWithSources feature anchors defined on source rdd to be evaluated + * @param bloomFilter bloomfilter to apply on source rdd + * @param requestedFeatureNames requested features + * @param featureTypeConfigs user specified 
feature types + * @return TransformedResultWithKey The output feature DataFrame conforms to FDS format + */ + private def transformFeaturesOnAvroRecord(df: DataFrame, + keyExtractor: SourceKeyExtractor, + featureAnchorWithSources: Seq[FeatureAnchorWithSource], + bloomFilter: Option[BloomFilter], + requestedFeatureNames: Seq[FeatureName], + featureTypeConfigs: Map[String, FeatureTypeConfig] = Map()): KeyedTransformedResult = { + if (!keyExtractor.isInstanceOf[MVELSourceKeyExtractor]) { + throw new FeathrException(ErrorLabel.FEATHR_ERROR, s"Error processing requested Feature :${requestedFeatureNames}. " + + s"Key extractor ${keyExtractor} must extends MVELSourceKeyExtractor.") + } + val extractor = keyExtractor.asInstanceOf[MVELSourceKeyExtractor] + if (!extractor.anchorExtractorV1.isInstanceOf[CanConvertToAvroRDD]) { + throw new FeathrException(ErrorLabel.FEATHR_ERROR, s"Error processing requested Feature :${requestedFeatureNames}. " + + s"isLowLevelRddExtractor() should return true and convertToAvroRdd should be implemented.") + } + val rdd = extractor.anchorExtractorV1.asInstanceOf[CanConvertToAvroRDD].convertToAvroRdd(df) + val filteredFactData = applyBloomFilterRdd(keyExtractor, rdd, bloomFilter) + + // Build a sequence of 3-tuple of (FeatureAnchorWithSource, featureNamePrefixPairs, AnchorExtractorBase) + val transformInfo = featureAnchorWithSources map { featureAnchorWithSource => + val extractor = featureAnchorWithSource.featureAnchor.extractor + extractor match { + case transformer: AnchorExtractorBase[IndexedRecord] => + // We no longer need prefix for the simplicity of the implementation, instead if there's a feature name + // and source data field clash, we will throw exception and ask user to rename the feature. + val featureNamePrefix = "" + val featureNames = featureAnchorWithSource.selectedFeatures.filter(requestedFeatureNames.contains) + val featureNamePrefixPairs = featureNames.map((_, featureNamePrefix)) + TransformInfo(featureAnchorWithSource, featureNamePrefixPairs, transformer) + + case _ => + throw new FeathrFeatureTransformationException(ErrorLabel.FEATHR_USER_ERROR, s"Unsupported transformer $extractor for features: $requestedFeatureNames") + } + } + + // to avoid name conflict between feature names and the raw data field names + val sourceKeyExtractors = transformInfo.map(_.featureAnchorWithSource.featureAnchor.sourceKeyExtractor) + assert(sourceKeyExtractors.map(_.toString).distinct.size == 1) + + val transformers = transformInfo map (_.transformer) + + /* + * Transform the given RDD by applying extractors to each row to create an RDD[Row] where each Row + * represents keys and feature values + */ + val spark = SparkSession.builder().getOrCreate() + val userProvidedFeatureTypes = transformInfo.flatMap(_.featureAnchorWithSource.featureAnchor.getFeatureTypes.getOrElse(Map.empty[String, FeatureTypes])).toMap + val FeatureTypeInferenceContext(featureTypeAccumulators) = + FeatureTransformation.getTypeInferenceContext(spark, userProvidedFeatureTypes, requestedFeatureNames) + val transformedRdd = filteredFactData map { record => + val (keys, featureValuesWithType) = transformAvroRecord(requestedFeatureNames, sourceKeyExtractors, transformers, record, featureTypeConfigs) + requestedFeatureNames.zip(featureValuesWithType).foreach { + case (featureRef, (_, featureType)) => + if (featureTypeAccumulators(featureRef).isZero && featureType != null) { + // This is lazy evaluated + featureTypeAccumulators(featureRef).add(FeatureTypes.valueOf(featureType.getBasicType.toString)) + } 
+ } + // Create a row by merging a row created from keys and a row created from term-vectors/tensors + Row.merge(Row.fromSeq(keys), Row.fromSeq(featureValuesWithType.map(_._1))) + } + + // Create a DataFrame from the above obtained RDD + val keyNames = getFeatureKeyColumnNamesRdd(sourceKeyExtractors.head, filteredFactData) + val (outputSchema, inferredFeatureTypeConfigs) = { + val allFeatureTypeConfigs = featureAnchorWithSources.flatMap(featureAnchorWithSource => featureAnchorWithSource.featureAnchor.featureTypeConfigs).toMap + val inferredFeatureTypes = inferFeatureTypes(featureTypeAccumulators, transformedRdd, requestedFeatureNames) + val inferredFeatureTypeConfigs = inferredFeatureTypes.map(x => x._1 -> new FeatureTypeConfig(x._2)) + val mergedFeatureTypeConfig = inferredFeatureTypeConfigs ++ allFeatureTypeConfigs + val colPrefix = "" + val featureTensorTypeInfo = getFDSSchemaFields(requestedFeatureNames, mergedFeatureTypeConfig, colPrefix) + val structFields = keyNames.foldRight(List.empty[StructField]) { + case (colName, acc) => + StructField(colName, StringType) :: acc + } + val outputSchema = StructType(StructType(structFields ++ featureTensorTypeInfo)) + (outputSchema, mergedFeatureTypeConfig) + } + val transformedDF = spark.createDataFrame(transformedRdd, outputSchema) + + val featureFormat = FeatureColumnFormat.FDS_TENSOR + val featureColumnFormats = requestedFeatureNames.map(name => name -> featureFormat).toMap + val transformedInfo = TransformedResult(transformInfo.flatMap(_.featureNamePrefixPairs), transformedDF, featureColumnFormats, inferredFeatureTypeConfigs) + KeyedTransformedResult(keyNames, transformedInfo) + } + + /** + * Apply a keyExtractor and feature transformer on a Record to extractor feature values. + * @param requestedFeatureNames requested feature names in the output. Extractors may produce more features than requested. + * @param sourceKeyExtractors extractor to extract the key from the record + * @param transformers transform to produce the feature value from the record + * @param record avro record to work on + * @param featureTypeConfigs user defined feature types + * @return tuple of (feature join key, sequence of (feature value, feature type) in the order of requestedFeatureNames) + */ + private def transformAvroRecord( + requestedFeatureNames: Seq[FeatureName], + sourceKeyExtractors: Seq[SourceKeyExtractor], + transformers: Seq[AnchorExtractorBase[IndexedRecord]], + record: IndexedRecord, + featureTypeConfigs: Map[String, FeatureTypeConfig] = Map()): (Seq[String], Seq[(Any, FeatureType)]) = { + val keys = sourceKeyExtractors.head match { + case mvelSourceKeyExtractor: MVELSourceKeyExtractor => mvelSourceKeyExtractor.getKey(record) + case _ => throw new FeathrFeatureTransformationException(ErrorLabel.FEATHR_USER_ERROR, s"${sourceKeyExtractors.head} is not a valid extractor on RDD") + } + + /* + * For the given row, apply all extractors to extract feature values. If requested as tensors, each feature value + * contains a tensor else a term-vector. 
+ */ + val features = transformers map { + case extractor: AnchorExtractor[IndexedRecord] => + val features = extractor.getFeatures(record) + FeatureValueTypeValidator.validate(features, featureTypeConfigs) + features + case extractor => + throw new FeathrFeatureTransformationException( + ErrorLabel.FEATHR_USER_ERROR, + s"Invalid extractor $extractor for features:" + + s"$requestedFeatureNames requested as tensors") + } reduce (_ ++ _) + if (logger.isTraceEnabled) { + logger.trace(s"Extracted features: $features") + } + + /* + * Retain feature values for only the requested features, and represent each feature value as + * a tensor, as specified. + */ + val featureValuesWithType = requestedFeatureNames map { name => + features.get(name) map { + case featureValue => + val tensorData: TensorData = featureValue.getAsTensorData() + val featureType: FeatureType = featureValue.getFeatureType() + val row = FeaturizedDatasetUtils.tensorToFDSDataFrameRow(tensorData) + (row, featureType) + } getOrElse ((null, null)) // return null if no feature value present + } + (keys, featureValuesWithType) + } + /** * Helper function to be used by groupFeatures. Given a collection of feature anchors which also contains information about grouping * criteria and extractor type per feature anchor, returns a map of FeatureGroupingCriteria to @@ -851,7 +1094,7 @@ private[offline] object FeatureTransformation { * others use direct aggregation * */ - private def transformMultiAnchorsOnSingleDataFrame( + private def transformFeaturesOnDataFrameRow( source: DataSourceAccessor, keyExtractor: SourceKeyExtractor, anchorsWithSameSource: Seq[FeatureAnchorWithSource], @@ -878,7 +1121,7 @@ private[offline] object FeatureTransformation { val incrAggCtx = incrementalAggContext.get val preAggDFs = incrAggCtx.previousSnapshotMap.collect { case (featureName, df) if requestedFeatures.exists(df.columns.contains) => df }.toSeq.distinct // join each previous aggregation dataframe sequentially - val groupKeys = getFeatureJoinKey(keyExtractor, preAggDFs.head) + val groupKeys = getFeatureKeyColumnNames(keyExtractor, preAggDFs.head) val keyColumnNames = getStandardizedKeyNames(groupKeys.size) val firstPreAgg = preAggDFs.head val joinedPreAggDFs = preAggDFs diff --git a/src/main/scala/com/linkedin/feathr/offline/transformation/DataFrameBasedRowEvaluator.scala b/src/main/scala/com/linkedin/feathr/offline/transformation/DataFrameBasedRowEvaluator.scala index d242372bf..cc6cba1c7 100644 --- a/src/main/scala/com/linkedin/feathr/offline/transformation/DataFrameBasedRowEvaluator.scala +++ b/src/main/scala/com/linkedin/feathr/offline/transformation/DataFrameBasedRowEvaluator.scala @@ -74,19 +74,20 @@ private[offline] object DataFrameBasedRowEvaluator { val featureTypes = featureTypeConfigs.mapValues(_.getFeatureType) val FeatureTypeInferenceContext(featureTypeAccumulators) = FeatureTransformation.getTypeInferenceContext(spark, featureTypes, featureRefStrs) + val transformedRdd = inputDF.rdd.map(row => { - // in some cases, the input dataframe row here only have Row and does not have schema attached, - // while MVEL only works with GenericRowWithSchema, create it manually - val rowWithSchema = if (row.isInstanceOf[GenericRowWithSchema]) { - row.asInstanceOf[GenericRowWithSchema] - } else { - new GenericRowWithSchema(row.toSeq.toArray, inputSchema) - } - if (rowExtractor.isInstanceOf[SimpleConfigurableAnchorExtractor]) { - rowExtractor.asInstanceOf[SimpleConfigurableAnchorExtractor].mvelContext = mvelContext - } - val result = 
rowExtractor.getFeaturesFromRow(rowWithSchema) - val featureValues = featureRefStrs map { + // in some cases, the input dataframe row here only have Row and does not have schema attached, + // while MVEL only works with GenericRowWithSchema, create it manually + val rowWithSchema = if (row.isInstanceOf[GenericRowWithSchema]) { + row.asInstanceOf[GenericRowWithSchema] + } else { + new GenericRowWithSchema(row.toSeq.toArray, inputSchema) + } + if (rowExtractor.isInstanceOf[SimpleConfigurableAnchorExtractor]) { + rowExtractor.asInstanceOf[SimpleConfigurableAnchorExtractor].mvelContext = mvelContext + } + val result = rowExtractor.getFeaturesFromRow(rowWithSchema) + val featureValues = featureRefStrs map { featureRef => if (result.contains(featureRef)) { val featureValue = result(featureRef) @@ -95,7 +96,7 @@ private[offline] object DataFrameBasedRowEvaluator { featureTypeAccumulators(featureRef).add(FeatureTypes.valueOf(rowFeatureType.toString)) } val tensorData: TensorData = featureValue.getAsTensorData() - FeaturizedDatasetUtils.tensorToDataFrameRow(tensorData) + FeaturizedDatasetUtils.tensorToFDSDataFrameRow(tensorData) } else null } Row.merge(row, Row.fromSeq(featureValues)) diff --git a/src/main/scala/com/linkedin/feathr/offline/transformation/DefaultValueSubstituter.scala b/src/main/scala/com/linkedin/feathr/offline/transformation/DefaultValueSubstituter.scala index 366967cc2..1b67d9558 100644 --- a/src/main/scala/com/linkedin/feathr/offline/transformation/DefaultValueSubstituter.scala +++ b/src/main/scala/com/linkedin/feathr/offline/transformation/DefaultValueSubstituter.scala @@ -112,7 +112,7 @@ private[offline] object DataFrameDefaultValueSubstituter extends DataFrameDefaul // For tensor default, since we don't have type, so we need to use expr to construct the default column val schema = field.dataType val tensorData = defaultFeatureValue.getAsTensorData - val ts = FeaturizedDatasetUtils.tensorToDataFrameRow(tensorData) + val ts = FeaturizedDatasetUtils.tensorToFDSDataFrameRow(tensorData) val fdsTensorDefaultUDF = getFDSTensorDefaultUDF(schema, ts) ss.udf.register("tz_udf", fdsTensorDefaultUDF) expr(s"tz_udf($featureColumnName)") diff --git a/src/main/scala/com/linkedin/feathr/offline/transformation/FDSConversionUtils.scala b/src/main/scala/com/linkedin/feathr/offline/transformation/FDSConversionUtils.scala index 824f48fe3..96a10a67c 100644 --- a/src/main/scala/com/linkedin/feathr/offline/transformation/FDSConversionUtils.scala +++ b/src/main/scala/com/linkedin/feathr/offline/transformation/FDSConversionUtils.scala @@ -37,7 +37,7 @@ private[offline] object FDSConversionUtils { // convert the "raw" input data into a FDS column a specific dataType rawFeatureValue match { case tensorData: TensorData => - FeaturizedDatasetUtils.tensorToDataFrameRow(tensorData, Some(targetDataType)) + FeaturizedDatasetUtils.tensorToFDSDataFrameRow(tensorData, Some(targetDataType)) case _ => targetDataType match { // Scalar tensor diff --git a/src/main/scala/com/linkedin/feathr/offline/util/FeatureValueTypeValidator.scala b/src/main/scala/com/linkedin/feathr/offline/util/FeatureValueTypeValidator.scala index ee06f3acd..aec0b1aea 100644 --- a/src/main/scala/com/linkedin/feathr/offline/util/FeatureValueTypeValidator.scala +++ b/src/main/scala/com/linkedin/feathr/offline/util/FeatureValueTypeValidator.scala @@ -16,7 +16,7 @@ private[offline] object FeatureValueTypeValidator { features.foreach { case (key, value) => featureTypeConfigs.get(key).foreach( - featureTypeConfig => 
FeatureValueTypeValidator.validate(value, featureTypeConfig)) + featureTypeConfig => FeatureValueTypeValidator.validate(key, value, featureTypeConfig)) } } @@ -27,9 +27,9 @@ private[offline] object FeatureValueTypeValidator { * @param featureValue value extracted from data * @param featureTypeConfig user-defined config, optional */ - def validate(featureValue: FeatureValue, featureTypeConfig: Option[FeatureTypeConfig]): Unit = { + def validate(featureValue: FeatureValue, featureTypeConfig: Option[FeatureTypeConfig], featureName: String): Unit = { featureTypeConfig match { - case Some(f) => validate(featureValue, f) + case Some(f) => validate(featureName, featureValue, f) case None => } } @@ -41,31 +41,31 @@ private[offline] object FeatureValueTypeValidator { * @param featureValue value extracted from data * @param featureTypeConfig user-defined config */ - def validate(featureValue: FeatureValue, featureTypeConfig: FeatureTypeConfig): Unit = { + def validate(featureName: String, featureValue: FeatureValue, featureTypeConfig: FeatureTypeConfig): Unit = { val configFeatureTypes = featureTypeConfig.getFeatureType val valueBasicType = featureValue.getFeatureType.getBasicType if (configFeatureTypes != FeatureTypes.UNSPECIFIED) { if (valueBasicType != FeatureType.BasicType.TENSOR || configFeatureTypes != FeatureTypes.TENSOR) { if (configFeatureTypes != FeatureTypes.valueOf(valueBasicType.name)) { - throw new FeathrException(ErrorLabel.FEATHR_USER_ERROR, "The FeatureValue type: " + valueBasicType - + " is not consistent with the type specified in the Feathr config: ." + configFeatureTypes); + throw new FeathrException(ErrorLabel.FEATHR_USER_ERROR, "The FeatureValue type of : " + featureName + + " is " + valueBasicType + ", which is not consistent with the type specified in the Feathr config: ." + configFeatureTypes); } } else if (featureTypeConfig.getTensorType != null) { val configTensorType = featureTypeConfig.getTensorType val valueTensorType = featureValue.getAsTypedTensor.getType if (configTensorType.getValueType != null && configTensorType.getValueType != valueTensorType.getValueType) { - throw new FeathrException(ErrorLabel.FEATHR_USER_ERROR, "The tensor value type: " + valueTensorType - + " is not consistent with the type specified in the Feathr config: ." + configTensorType); + throw new FeathrException(ErrorLabel.FEATHR_USER_ERROR, "The tensor value type of :" + featureName + + " is " + valueTensorType + ", which is not consistent with the type specified in the Feathr config: ." + configTensorType); } if (configTensorType.getTensorCategory != null && configTensorType.getTensorCategory != valueTensorType.getTensorCategory) { - throw new FeathrException(ErrorLabel.FEATHR_USER_ERROR, "The tensor category type: " + valueTensorType - + " is not consistent with the type specified in the Feathr config: ." + configTensorType); + throw new FeathrException(ErrorLabel.FEATHR_USER_ERROR, "The tensor category type of : " + featureName + " is " + + valueTensorType + ", which is not consistent with the type specified in the Feathr config: ." + configTensorType); } if (configTensorType.getDimensionTypes != null && configTensorType.getDimensionTypes != valueTensorType.getDimensionTypes) { - throw new FeathrException(ErrorLabel.FEATHR_USER_ERROR, "The tensor dimension type: " + valueTensorType - + " is not consistent with the type specified in the Feathr config: ." 
+ configTensorType); + throw new FeathrException(ErrorLabel.FEATHR_USER_ERROR, "The tensor dimension type of : " + featureName + " is " + + valueTensorType + ", which is not consistent with the type specified in the Feathr config: ." + configTensorType); } } } diff --git a/src/main/scala/com/linkedin/feathr/offline/util/FeaturizedDatasetUtils.scala b/src/main/scala/com/linkedin/feathr/offline/util/FeaturizedDatasetUtils.scala index d672cf5f5..534881f7a 100644 --- a/src/main/scala/com/linkedin/feathr/offline/util/FeaturizedDatasetUtils.scala +++ b/src/main/scala/com/linkedin/feathr/offline/util/FeaturizedDatasetUtils.scala @@ -157,7 +157,7 @@ private[offline] object FeaturizedDatasetUtils { * @return the Quince-FDS struct or primitive */ - def tensorToDataFrameRow(tensor: TensorData, targetDataType: Option[DataType] = None): Any = { + def tensorToFDSDataFrameRow(tensor: TensorData, targetDataType: Option[DataType] = None): Any = { tensor match { case null => null case _ => diff --git a/src/test/scala/com/linkedin/feathr/offline/util/TestFeatureValueTypeValidator.scala b/src/test/scala/com/linkedin/feathr/offline/util/TestFeatureValueTypeValidator.scala index 1e9bae9b7..bda25b1cc 100644 --- a/src/test/scala/com/linkedin/feathr/offline/util/TestFeatureValueTypeValidator.scala +++ b/src/test/scala/com/linkedin/feathr/offline/util/TestFeatureValueTypeValidator.scala @@ -45,7 +45,7 @@ class TestFeatureValueTypeValidator extends TestFeathr { new FeatureValue(value, valueFeatureType.asInstanceOf[FeatureTypes]); } val featureTypeConfig = new FeatureTypeConfig(configFeatureTypes.asInstanceOf[FeatureTypes], configTensorType.asInstanceOf[TensorType], null) - FeatureValueTypeValidator.validate(featureValue, featureTypeConfig) + FeatureValueTypeValidator.validate("", featureValue, featureTypeConfig) } @DataProvider(name = "failTestCases") @@ -75,7 +75,7 @@ class TestFeatureValueTypeValidator extends TestFeathr { new FeatureValue(value, valueFeatureType.asInstanceOf[FeatureTypes]); } val featureTypeConfig = new FeatureTypeConfig(configFeatureTypes.asInstanceOf[FeatureTypes], configTensorType.asInstanceOf[TensorType], null) - FeatureValueTypeValidator.validate(featureValue, featureTypeConfig) + FeatureValueTypeValidator.validate("", featureValue, featureTypeConfig) } From 5fc3730907d6f4acdcec09e7fa7542d6dfc734a1 Mon Sep 17 00:00:00 2001 From: Jinghui Mo Date: Fri, 7 Oct 2022 20:02:36 -0400 Subject: [PATCH 04/68] Save lookup feature definition to HOCON files (#732) --- feathr_project/feathr/definition/lookup_feature.py | 6 ++++-- feathr_project/test/test_lookup_feature.py | 2 ++ 2 files changed, 6 insertions(+), 2 deletions(-) diff --git a/feathr_project/feathr/definition/lookup_feature.py b/feathr_project/feathr/definition/lookup_feature.py index 647df37ce..2f1b80ccd 100644 --- a/feathr_project/feathr/definition/lookup_feature.py +++ b/feathr_project/feathr/definition/lookup_feature.py @@ -4,12 +4,13 @@ from jinja2 import Template from feathr.definition.dtype import FeatureType +from feathr.definition.feature_derivations import DerivedFeature from feathr.definition.feature import FeatureBase from feathr.definition.transformation import RowTransformation from feathr.definition.typed_key import DUMMY_KEY, TypedKey from feathr.definition.aggregation import Aggregation -class LookupFeature(FeatureBase): +class LookupFeature(DerivedFeature): """A lookup feature is a feature defined on top of two other features, i.e. 
using the feature value of the base feature as key, to lookup the feature value from the expansion feature. e.g. a lookup feature user_purchased_item_avg_price could be key-ed by user_id, and computed by: base feature is user_purchased_item_ids. For a given user_id, it returns the item ids purchased by the user. @@ -36,7 +37,8 @@ def __init__(self, key: Optional[Union[TypedKey, List[TypedKey]]] = [DUMMY_KEY], registry_tags: Optional[Dict[str, str]] = None, ): - super(LookupFeature, self).__init__(name, feature_type, key=key, registry_tags=registry_tags) + super(LookupFeature, self).__init__(name, feature_type, input_features=[base_feature, expansion_feature], + transform="", key=key, registry_tags=registry_tags) self.base_feature = base_feature self.expansion_feature = expansion_feature self.aggregation = aggregation diff --git a/feathr_project/test/test_lookup_feature.py b/feathr_project/test/test_lookup_feature.py index ffdb9a686..82fe385a7 100644 --- a/feathr_project/test/test_lookup_feature.py +++ b/feathr_project/test/test_lookup_feature.py @@ -1,6 +1,7 @@ from feathr import Aggregation from feathr import Feature from feathr import LookupFeature +from feathr import DerivedFeature from feathr import FLOAT, FLOAT_VECTOR, ValueType, INT32_VECTOR from feathr import TypedKey @@ -39,4 +40,5 @@ def test_single_key_lookup_feature_to_config(): } }""" assert_config_equals(lookup_feature.to_feature_config(), lookup_feature_config) + assert(isinstance(lookup_feature, DerivedFeature)) \ No newline at end of file From 356f74b409c9e8e17a2eba51a6c21266ed465afe Mon Sep 17 00:00:00 2001 From: Jun Ki Min <42475935+loomlike@users.noreply.github.com> Date: Fri, 7 Oct 2022 17:03:32 -0700 Subject: [PATCH 05/68] Fix function string parsing (#725) * Add version. Fix function string parsing Signed-off-by: Jun Ki Min <42475935+loomlike@users.noreply.github.com> * Add unit test Signed-off-by: Jun Ki Min <42475935+loomlike@users.noreply.github.com> * Add comments Signed-off-by: Jun Ki Min <42475935+loomlike@users.noreply.github.com> Signed-off-by: Jun Ki Min <42475935+loomlike@users.noreply.github.com> --- feathr_project/feathr/__init__.py | 5 +++ .../udf/_preprocessing_pyudf_manager.py | 45 +++++++++++-------- .../udf/test_preprocessing_pyudf_manager.py | 15 +++++++ 3 files changed, 47 insertions(+), 18 deletions(-) create mode 100644 feathr_project/test/unit/udf/test_preprocessing_pyudf_manager.py diff --git a/feathr_project/feathr/__init__.py b/feathr_project/feathr/__init__.py index fae0cb60c..9b0cf0a49 100644 --- a/feathr_project/feathr/__init__.py +++ b/feathr_project/feathr/__init__.py @@ -1,3 +1,5 @@ +import pkg_resources + from .client import FeathrClient from .spark_provider.feathr_configurations import SparkExecutionConfiguration from .definition.feature_derivations import * @@ -74,3 +76,6 @@ 'FeaturePrinter', 'SparkExecutionConfiguration', ] + + +__version__ = pkg_resources.require("feathr")[0].version diff --git a/feathr_project/feathr/udf/_preprocessing_pyudf_manager.py b/feathr_project/feathr/udf/_preprocessing_pyudf_manager.py index ca7114343..55756ba3d 100644 --- a/feathr_project/feathr/udf/_preprocessing_pyudf_manager.py +++ b/feathr_project/feathr/udf/_preprocessing_pyudf_manager.py @@ -1,12 +1,15 @@ +import ast import inspect import os +import pickle from pathlib import Path from typing import List, Optional, Union -import pickle -from feathr.definition.anchor import FeatureAnchor + from jinja2 import Template + +from feathr.definition.anchor import FeatureAnchor from feathr.definition.source 
import HdfsSource -import ast + # Some metadata that are only needed by Feathr FEATHR_PYSPARK_METADATA = 'generated_feathr_pyspark_metadata' @@ -42,7 +45,7 @@ def build_anchor_preprocessing_metadata(anchor_list: List[FeatureAnchor], local_ # delete the file if it already exists to avoid caching previous results for f in [client_udf_repo_path, metadata_path, pyspark_driver_path]: if os.path.exists(f): - os.remove(f) + os.remove(f) for anchor in anchor_list: # only support batch source preprocessing for now. @@ -73,23 +76,29 @@ def build_anchor_preprocessing_metadata(anchor_list: List[FeatureAnchor], local_ with open(feathr_pyspark_metadata_abs_path, 'wb') as file: pickle.dump(features_with_preprocessing, file) + @staticmethod - def _parse_function_str_for_name(source: str) -> str: - """ - Use AST to parse the functions and get the name out. + def _parse_function_str_for_name(fn_str: str) -> str: + """Use AST to parse the function string and get the name out. + + Args: + fn_str: Function code in string. + + Returns: + Name of the function. """ - if source is None: + if not fn_str: return None - tree = ast.parse(source) + + tree = ast.parse(fn_str) + + # tree.body contains a list of function definition objects parsed from the input string. + # Currently, we only accept a single function. if len(tree.body) != 1 or not isinstance(tree.body[0], ast.FunctionDef): - raise ValueError('provided code fragment is not a single function') - code = compile(source=tree, filename='custom.py',mode= 'exec') - # https://docs.python.org/3/library/inspect.html see the inspect module for more details - # tuple of names other than arguments and function locals. Assume there will be only one function, so will return the first as the name - for ele in code.co_consts: - # find the first object, that is the str, this will be the name of the function - if isinstance(ele, str): - return ele + raise ValueError("provided code fragment is not a single function") + + # Get the function name from the function definition. 
+ return tree.body[0].name @staticmethod @@ -174,7 +183,7 @@ def prepare_pyspark_udf_files(feature_names: List[str], local_workspace_dir): client_udf_repo_path = os.path.join(local_workspace_dir, FEATHR_CLIENT_UDF_FILE_NAME) # write pyspark_driver_template_abs_path and then client_udf_repo_path filenames = [pyspark_driver_template_abs_path, client_udf_repo_path] - + with open(pyspark_driver_path, 'w') as outfile: for fname in filenames: with open(fname) as infile: diff --git a/feathr_project/test/unit/udf/test_preprocessing_pyudf_manager.py b/feathr_project/test/unit/udf/test_preprocessing_pyudf_manager.py new file mode 100644 index 000000000..1daa87632 --- /dev/null +++ b/feathr_project/test/unit/udf/test_preprocessing_pyudf_manager.py @@ -0,0 +1,15 @@ +import pytest + +from feathr.udf._preprocessing_pyudf_manager import _PreprocessingPyudfManager + + +@pytest.mark.parametrize( + "fn_name, fn_str", + [ + ("fn_without_type_hint", "def fn_without_type_hint(a):\n return a + 10\n"), + ("fn_with_type_hint", "def fn_with_type_hint(a: int) -> int:\n return a + 10\n"), + ("fn_with_complex_type_hint", "def fn_with_complex_type_hint(a: Union[int, float]) -> Union[int, float]:\n return a + 10\n"), + ] +) +def test__parse_function_str_for_name(fn_name, fn_str): + assert fn_name == _PreprocessingPyudfManager._parse_function_str_for_name(fn_str) From b433039d9c416863a5ee8758a2e885fa7af5aae2 Mon Sep 17 00:00:00 2001 From: Enya-Yx <108409954+enya-yx@users.noreply.github.com> Date: Tue, 11 Oct 2022 07:19:25 +0800 Subject: [PATCH 06/68] Apply a same credential within each sample (#718) Co-authored-by: enya-yx --- docs/samples/fraud_detection_demo.ipynb | 2 +- docs/samples/product_recommendation_demo.ipynb | 2 +- docs/samples/product_recommendation_demo_advanced.ipynb | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/docs/samples/fraud_detection_demo.ipynb b/docs/samples/fraud_detection_demo.ipynb index 88c672160..0f35bc3bb 100644 --- a/docs/samples/fraud_detection_demo.ipynb +++ b/docs/samples/fraud_detection_demo.ipynb @@ -284,7 +284,7 @@ }, "outputs": [], "source": [ - "client = FeathrClient(config_path=tmp.name)" + "client = FeathrClient(config_path=tmp.name, credential=credential)" ] }, { diff --git a/docs/samples/product_recommendation_demo.ipynb b/docs/samples/product_recommendation_demo.ipynb index aa7699eb5..8636bb992 100644 --- a/docs/samples/product_recommendation_demo.ipynb +++ b/docs/samples/product_recommendation_demo.ipynb @@ -284,7 +284,7 @@ "metadata": {}, "outputs": [], "source": [ - "feathr_client = FeathrClient(config_path=tmp.name)" + "feathr_client = FeathrClient(config_path=tmp.name, credential=credential)" ] }, { diff --git a/docs/samples/product_recommendation_demo_advanced.ipynb b/docs/samples/product_recommendation_demo_advanced.ipynb index fff2a1cd5..de3eb2654 100644 --- a/docs/samples/product_recommendation_demo_advanced.ipynb +++ b/docs/samples/product_recommendation_demo_advanced.ipynb @@ -420,7 +420,7 @@ }, "outputs": [], "source": [ - "client = FeathrClient(config_path=tmp.name)" + "client = FeathrClient(config_path=tmp.name, credential=credential)" ] }, { From a3255976b8e9ffe993b11e1115e29704972cc1c0 Mon Sep 17 00:00:00 2001 From: Enya-Yx <108409954+enya-yx@users.noreply.github.com> Date: Tue, 11 Oct 2022 13:11:31 +0800 Subject: [PATCH 07/68] Enable incremental for HDFS sink (#695) * Enable incremental for HDFS sink * Add docstring * Add docs * minor fix * minor changes * quick fix Co-authored-by: enya-yx --- docs/concepts/materializing-features.md | 12 
+++++++++++ .../definition/_materialization_utils.py | 3 +++ .../definition/materialization_settings.py | 5 ++++- feathr_project/feathr/definition/sink.py | 20 ++++++++++++++++--- .../test/test_feature_materialization.py | 5 +++++ 5 files changed, 41 insertions(+), 4 deletions(-) diff --git a/docs/concepts/materializing-features.md b/docs/concepts/materializing-features.md index 28d824525..eacf980ff 100644 --- a/docs/concepts/materializing-features.md +++ b/docs/concepts/materializing-features.md @@ -31,6 +31,18 @@ More reference on the APIs: In the above example, we define a Redis table called `nycTaxiDemoFeature` and materialize two features called `f_location_avg_fare` and `f_location_max_fare` to Redis. +## Incremental Aggregation +Use incremental aggregation will significantly expedite the WindowAggTransformation feature calculation. +For example, aggregation sum of a feature F within a 180-day window at day T can be expressed as: F(T) = F(T - 1)+DirectAgg(T-1)-DirectAgg(T - 181). +Once a SNAPSHOT of the first day is generated, the calculation for the following days can leverage it. + +A storeName is required if incremental aggregated is enabled. There could be multiple output Datasets, and each of them need to be stored in a separate folder. The storeName is used as the folder name to create under the base "path". + +Incremental aggregation is enabled by default when using HdfsSink. + +More reference on the APIs: +- [HdfsSink API doc](https://feathr.readthedocs.io/en/latest/feathr.html#feathr.HdfsSink) + ## Feature Backfill It is also possible to backfill the features till a particular time, like below. If the `BackfillTime` part is not specified, it's by default to `now()` (i.e. if not specified, it's equivalent to `BackfillTime(start=now, end=now, step=timedelta(days=1))`). 
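For context, a minimal Python sketch of the incremental HDFS materialization described above. The `client` instance, the output path, and the backfill window are illustrative assumptions and not part of this change; feature names are taken from the existing docs/tests.

```python
from datetime import datetime, timedelta

from feathr import BackfillTime, HdfsSink, MaterializationSettings

# Illustrative backfill window; replace with your own date range.
backfill_time = BackfillTime(start=datetime(2020, 5, 10),
                             end=datetime(2020, 5, 20),
                             step=timedelta(days=1))

# store_name is the folder created under output_path that holds each dataset's
# SNAPSHOT; incremental aggregation is enabled by default for HdfsSink.
offline_sink = HdfsSink(
    output_path="abfss://<container>@<account>.dfs.core.windows.net/materialized_features/",
    store_name="df0",
)

settings = MaterializationSettings(
    name="nycTaxiMaterializationJob",
    sinks=[offline_sink],
    feature_names=["f_location_avg_fare", "f_location_max_fare"],
    backfill_time=backfill_time,
)

# Assumes `client` is an already-configured FeathrClient.
client.materialize_features(settings)
```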
diff --git a/feathr_project/feathr/definition/_materialization_utils.py b/feathr_project/feathr/definition/_materialization_utils.py index ef066b104..b49f7dced 100644 --- a/feathr_project/feathr/definition/_materialization_utils.py +++ b/feathr_project/feathr/definition/_materialization_utils.py @@ -10,6 +10,9 @@ def _to_materialization_config(settings: MaterializationSettings): endTime: "{{ settings.backfill_time.end.strftime('%Y-%m-%d %H:%M:%S') }}" endTimeFormat: "yyyy-MM-dd HH:mm:ss" resolution: DAILY + {% if settings.has_hdfs_sink == True %} + enableIncremental = true + {% endif %} output:[ {% for sink in settings.sinks %} {{sink.to_feature_config()}} diff --git a/feathr_project/feathr/definition/materialization_settings.py b/feathr_project/feathr/definition/materialization_settings.py index 8cdc2fc71..27b644139 100644 --- a/feathr_project/feathr/definition/materialization_settings.py +++ b/feathr_project/feathr/definition/materialization_settings.py @@ -32,7 +32,10 @@ def __init__(self, name: str, sinks: List[Sink], feature_names: List[str], backf now = datetime.now() self.backfill_time = backfill_time if backfill_time else BackfillTime(start=now, end=now, step=timedelta(days=1)) for sink in sinks: - if isinstance(sink, RedisSink): + if isinstance(sink, HdfsSink): + self.has_hdfs_sink = True + sink.aggregation_features = feature_names + elif isinstance(sink, RedisSink): sink.aggregation_features = feature_names self.sinks = sinks self.feature_names = feature_names diff --git a/feathr_project/feathr/definition/sink.py b/feathr_project/feathr/definition/sink.py index a23718a44..71c406561 100644 --- a/feathr_project/feathr/definition/sink.py +++ b/feathr_project/feathr/definition/sink.py @@ -103,25 +103,35 @@ def to_argument(self): class HdfsSink(Sink): """Offline Hadoop HDFS-compatible(HDFS, delta lake, Azure blog storage etc) sink that is used to store feature data. - The result is in AVRO format. + The result is in AVRO format. + + Incremental aggregation is enabled by default when using HdfsSink. Use incremental aggregation will significantly expedite the WindowAggTransformation feature calculation. + For example, aggregation sum of a feature F within a 180-day window at day T can be expressed as: F(T) = F(T - 1)+DirectAgg(T-1)-DirectAgg(T - 181). + Once a SNAPSHOT of the first day is generated, the calculation for the following days can leverage it. Attributes: output_path: output path + store_name: the folder name under the base "path". Used especially for the current dataset to support 'Incremental' aggregation. 
+ """ - def __init__(self, output_path: str) -> None: + def __init__(self, output_path: str, store_name: Optional[str]="df0") -> None: self.output_path = output_path - + self.store_name = store_name # Sample generated HOCON config: # operational: { # name: testFeatureGen # endTime: 2019-05-01 # endTimeFormat: "yyyy-MM-dd" # resolution: DAILY + # enableIncremental = true # output:[ # { # name: HDFS + # outputFormat: RAW_DATA # params: { # path: "/user/featureGen/hdfsResult/" + # features: [mockdata_a_ct_gen, mockdata_a_sample_gen] + # storeName: "yyyy/MM/dd" # } # } # ] @@ -132,11 +142,15 @@ def to_feature_config(self) -> str: tm = Template(""" { name: HDFS + outputFormat: RAW_DATA params: { path: "{{sink.output_path}}" {% if sink.aggregation_features %} features: [{{','.join(sink.aggregation_features)}}] {% endif %} + {% if sink.store_name %} + storeName: "{{sink.store_name}}" + {% endif %} } } """) diff --git a/feathr_project/test/test_feature_materialization.py b/feathr_project/test/test_feature_materialization.py index 62b84d367..edd9bb537 100644 --- a/feathr_project/test/test_feature_materialization.py +++ b/feathr_project/test/test_feature_materialization.py @@ -61,12 +61,17 @@ def test_feature_materialization_offline_config(): endTime: "2020-05-20 00:00:00" endTimeFormat: "yyyy-MM-dd HH:mm:ss" resolution: DAILY + enableIncremental = true output:[ { name: HDFS + outputFormat: RAW_DATA params: { path: "abfss://feathrazuretest3fs@feathrazuretest3storage.dfs.core.windows.net/demo_data/output/hdfs_test.avro" + features: [f_location_avg_fare,f_location_max_fare] + storeName: "df0" } + } ] } From bb679390b30ae270c214c799d07b2a26595f6d14 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E5=BE=90=E8=BE=B0?= Date: Wed, 12 Oct 2022 00:16:15 +0800 Subject: [PATCH 08/68] #492 fix, fail only if different sources have same name (#733) --- feathr_project/feathr/client.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/feathr_project/feathr/client.py b/feathr_project/feathr/client.py index f21d37d23..759a33365 100644 --- a/feathr_project/feathr/client.py +++ b/feathr_project/feathr/client.py @@ -216,7 +216,7 @@ def build_features(self, anchor_list: List[FeatureAnchor] = [], derived_feature_ f"definitions. Anchor name of {anchor} is already defined in {anchor_names[anchor.name]}") else: anchor_names[anchor.name] = anchor - if anchor.source.name in source_names: + if anchor.source.name in source_names and (anchor.source is not source_names[anchor.source.name]): raise RuntimeError(f"Source name should be unique but there are duplicate source names in your source " f"definitions. 
Source name of {anchor.source} is already defined in {source_names[anchor.source.name]}") else: From 4f76e19cdbb2472423c93e44d0c3c843b9765e57 Mon Sep 17 00:00:00 2001 From: Enya-Yx <108409954+enya-yx@users.noreply.github.com> Date: Wed, 12 Oct 2022 10:55:15 +0800 Subject: [PATCH 09/68] Remove unused credentials and deprecated purview settings (#708) * Remove unused credentials and deprecated purview settings --- docs/how-to-guides/azure-deployment-cli.md | 1 - docs/how-to-guides/feathr-configuration-and-env.md | 6 +++--- docs/quickstart_synapse.md | 6 ------ docs/samples/customer360/Customer360.ipynb | 11 +---------- .../databricks_quickstart_nyc_taxi_driver.ipynb | 8 +------- docs/samples/product_recommendation_demo.ipynb | 2 +- .../product_recommendation_demo_advanced.ipynb | 2 +- 7 files changed, 7 insertions(+), 29 deletions(-) diff --git a/docs/how-to-guides/azure-deployment-cli.md b/docs/how-to-guides/azure-deployment-cli.md index 3762f7b3f..70067b148 100644 --- a/docs/how-to-guides/azure-deployment-cli.md +++ b/docs/how-to-guides/azure-deployment-cli.md @@ -117,7 +117,6 @@ echo "AZURE_TENANT_ID: $sp_tenantid" echo "AZURE_CLIENT_SECRET: $sp_password" This will give three variables: AZURE_CLIENT_ID, AZURE_TENANT_ID and AZURE_CLIENT_SECRET. You will need them later. ``` - Note: **You should save AZURE_CLIENT_SECRET because you will only see it once here** ## Create a storage account diff --git a/docs/how-to-guides/feathr-configuration-and-env.md b/docs/how-to-guides/feathr-configuration-and-env.md index fd32fb2f6..e4d393a43 100644 --- a/docs/how-to-guides/feathr-configuration-and-env.md +++ b/docs/how-to-guides/feathr-configuration-and-env.md @@ -77,9 +77,9 @@ Feathr will get the configurations in the following order: | ONLINE_STORE__REDIS__SSL_ENABLED | Whether SSL is enabled to access Redis cluster. | Required if using Redis as online store. | | REDIS_PASSWORD | Password for the Redis cluster. | Required if using Redis as online store. | | FEATURE_REGISTRY__API_ENDPOINT | Specifies registry endpoint. | Required if using registry service. | -| FEATURE_REGISTRY__PURVIEW__PURVIEW_NAME | Configure the name of the purview endpoint. | Required if using Purview directly without registry service. Deprecate soon, see [here](#deprecation) for more details.| -| FEATURE_REGISTRY__PURVIEW__DELIMITER | See [here](#FEATURE_REGISTRY__PURVIEW__DELIMITER) for more details. | Required if using Purview directly without registry service. Deprecate soon, see [here](#deprecation) for more details.| -| FEATURE_REGISTRY__PURVIEW__TYPE_SYSTEM_INITIALIZATION | Controls whether the type system (think this as the "schema" for the registry) will be initialized or not. Usually this is only required to be set to `True` to initialize schema, and then you can set it to `False` to shorten the initialization time. | Required if using Purview directly without registry service. Deprecate soon, see [here](#deprecation) for more details.| +| FEATURE_REGISTRY__PURVIEW__PURVIEW_NAME (Deprecated Soon) | Configure the name of the purview endpoint. | Required if using Purview directly without registry service. Deprecate soon, see [here](#deprecation) for more details.| +| FEATURE_REGISTRY__PURVIEW__DELIMITER (Deprecated Soon) | See [here](#FEATURE_REGISTRY__PURVIEW__DELIMITER) for more details. | Required if using Purview directly without registry service. 
Deprecate soon, see [here](#deprecation) for more details.| +| FEATURE_REGISTRY__PURVIEW__TYPE_SYSTEM_INITIALIZATION (Deprecated Soon)| Controls whether the type system (think this as the "schema" for the registry) will be initialized or not. Usually this is only required to be set to `True` to initialize schema, and then you can set it to `False` to shorten the initialization time. | Required if using Purview directly without registry service. Deprecate soon, see [here](#deprecation) for more details.| # Explanation for selected configurations diff --git a/docs/quickstart_synapse.md b/docs/quickstart_synapse.md index 5dee17931..0a66a96bb 100644 --- a/docs/quickstart_synapse.md +++ b/docs/quickstart_synapse.md @@ -61,9 +61,6 @@ project_config: # Redis password for your online store - "REDIS_PASSWORD" # Client IDs and Client Secret for the service principal. Read the getting started docs on how to get those information. - - "AZURE_CLIENT_ID" - - "AZURE_TENANT_ID" - - "AZURE_CLIENT_SECRET" offline_store: --- @@ -98,9 +95,6 @@ These values can also be retrieved by using cloud key value store, such as [Azur ```python import os os.environ['REDIS_PASSWORD'] = '' -os.environ['AZURE_CLIENT_ID'] = '' -os.environ['AZURE_TENANT_ID'] = '' -os.environ['AZURE_CLIENT_SECRET'] = '' ``` Please refer to [A note on using azure key vault to store credentials](https://github.com/feathr-ai/feathr/blob/41e7496b38c43af6d7f8f1de842f657b27840f6d/docs/how-to-guides/feathr-configuration-and-env.md#a-note-on-using-azure-key-vault-to-store-credentials) for more details. diff --git a/docs/samples/customer360/Customer360.ipynb b/docs/samples/customer360/Customer360.ipynb index 4b202e13a..db042011b 100644 --- a/docs/samples/customer360/Customer360.ipynb +++ b/docs/samples/customer360/Customer360.ipynb @@ -192,9 +192,6 @@ " project_name: 'customer360'\n", " required_environment_variables:\n", " - 'REDIS_PASSWORD'\n", - " - 'AZURE_CLIENT_ID'\n", - " - 'AZURE_TENANT_ID'\n", - " - 'AZURE_CLIENT_SECRET'\n", " - 'ADLS_ACCOUNT'\n", " - 'ADLS_KEY'\n", " - 'WASB_ACCOUNT'\n", @@ -239,10 +236,7 @@ " port: 6380\n", " ssl_enabled: True\n", "feature_registry:\n", - " purview:\n", - " type_system_initialization: true\n", - " purview_name: ''\n", - " delimiter: '__'\n", + " api_endpoint: \"https://.azurewebsites.net/api/v1\"\n", "\"\"\"\n", "# write this configuration string to a temporary location and load it to Feathr\n", "tmp = tempfile.NamedTemporaryFile(mode='w', delete=False)\n", @@ -331,9 +325,6 @@ "source": [ "import os\n", "os.environ['REDIS_PASSWORD'] = ''\n", - "os.environ['AZURE_CLIENT_ID'] = ''\n", - "os.environ['AZURE_TENANT_ID'] = ''\n", - "os.environ['AZURE_CLIENT_SECRET'] = ''\n", "os.environ['ADLS_ACCOUNT'] = ''\n", "os.environ['ADLS_KEY'] = ''\n", "os.environ['WASB_ACCOUNT'] = \"\"\n", diff --git a/docs/samples/databricks/databricks_quickstart_nyc_taxi_driver.ipynb b/docs/samples/databricks/databricks_quickstart_nyc_taxi_driver.ipynb index 82aaf3832..52790f884 100644 --- a/docs/samples/databricks/databricks_quickstart_nyc_taxi_driver.ipynb +++ b/docs/samples/databricks/databricks_quickstart_nyc_taxi_driver.ipynb @@ -332,9 +332,6 @@ " project_name: 'feathr_getting_started2'\n", " required_environment_variables:\n", " - 'REDIS_PASSWORD'\n", - " - 'AZURE_CLIENT_ID'\n", - " - 'AZURE_TENANT_ID'\n", - " - 'AZURE_CLIENT_SECRET'\n", "offline_store:\n", " adls:\n", " adls_enabled: true\n", @@ -364,10 +361,7 @@ " port: 6380\n", " ssl_enabled: True\n", "feature_registry:\n", - " purview:\n", - " type_system_initialization: 
true\n", - " purview_name: ''\n", - " delimiter: '__'\n", + " api_endpoint: \"https://.azurewebsites.net/api/v1\"\n", "\"\"\"\n", "tmp = tempfile.NamedTemporaryFile(mode='w', delete=False)\n", "with open(tmp.name, \"w\") as text_file:\n", diff --git a/docs/samples/product_recommendation_demo.ipynb b/docs/samples/product_recommendation_demo.ipynb index 8636bb992..9ae3ee34d 100644 --- a/docs/samples/product_recommendation_demo.ipynb +++ b/docs/samples/product_recommendation_demo.ipynb @@ -260,7 +260,7 @@ "\n", "You should setup the environment variables in order to run this sample. More environment variables can be set by referring to [feathr_config.yaml](https://github.com/linkedin/feathr/blob/main/feathr_project/feathrcli/data/feathr_user_workspace/feathr_config.yaml) and use that as the source of truth. It also has more explanations on the meaning of each variable.\n", "\n", - "To run this notebook, for Azure users, you need AZURE_CLIENT_ID, AZURE_TENANT_ID, AZURE_CLIENT_SECRET and REDIS_PASSWORD.\n", + "To run this notebook, for Azure users, you need REDIS_PASSWORD.\n", "To run this notebook, for Databricks useres, you need DATABRICKS_WORKSPACE_TOKEN_VALUE and REDIS_PASSWORD." ] }, diff --git a/docs/samples/product_recommendation_demo_advanced.ipynb b/docs/samples/product_recommendation_demo_advanced.ipynb index de3eb2654..e4c5917a5 100644 --- a/docs/samples/product_recommendation_demo_advanced.ipynb +++ b/docs/samples/product_recommendation_demo_advanced.ipynb @@ -389,7 +389,7 @@ "\n", "You should setup the environment variables in order to run this sample. More environment variables can be set by referring to [feathr_config.yaml](https://github.com/linkedin/feathr/blob/main/feathr_project/feathrcli/data/feathr_user_workspace/feathr_config.yaml) and use that as the source of truth. It also has more explanations on the meaning of each variable.\n", "\n", - "To run this notebook, for Azure users, you need AZURE_CLIENT_ID, AZURE_TENANT_ID, AZURE_CLIENT_SECRET and REDIS_PASSWORD.\n", + "To run this notebook, for Azure users, you need REDIS_PASSWORD.\n", "To run this notebook, for Databricks useres, you need DATABRICKS_WORKSPACE_TOKEN_VALUE and REDIS_PASSWORD." 
] }, From 18d776d3a35edd23e1d8db2bd643c5d88bb09f5f Mon Sep 17 00:00:00 2001 From: Blair Chen Date: Wed, 12 Oct 2022 11:11:39 +0800 Subject: [PATCH 10/68] Revoke token submitted by mistaken (#730) --- .../test_user_workspace/feathr_config_registry_purview.yaml | 2 +- .../feathr_config_registry_purview_rbac.yaml | 2 +- .../test/test_user_workspace/feathr_config_registry_sql.yaml | 2 +- .../test_user_workspace/feathr_config_registry_sql_rbac.yaml | 2 +- 4 files changed, 4 insertions(+), 4 deletions(-) diff --git a/feathr_project/test/test_user_workspace/feathr_config_registry_purview.yaml b/feathr_project/test/test_user_workspace/feathr_config_registry_purview.yaml index afe923163..f716da0b4 100644 --- a/feathr_project/test/test_user_workspace/feathr_config_registry_purview.yaml +++ b/feathr_project/test/test_user_workspace/feathr_config_registry_purview.yaml @@ -28,7 +28,7 @@ spark_config: feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" databricks: workspace_instance_url: 'https://adb-2474129336842816.16.azuredatabricks.net/' - workspace_token_value: 'dapid8ddd83000dc2863763b7d47f0e8f3db' + workspace_token_value: '' config_template: {"run_name":"FEATHR_FILL_IN","new_cluster":{"spark_version":"9.1.x-scala2.12","num_workers":1,"spark_conf":{"FEATHR_FILL_IN":"FEATHR_FILL_IN"},"instance_pool_id":"0403-214809-inlet434-pool-l9dj3kwz"},"libraries":[{"jar":"FEATHR_FILL_IN"}],"spark_jar_task":{"main_class_name":"FEATHR_FILL_IN","parameters":["FEATHR_FILL_IN"]}} work_dir: 'dbfs:/feathr_getting_started' feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" diff --git a/feathr_project/test/test_user_workspace/feathr_config_registry_purview_rbac.yaml b/feathr_project/test/test_user_workspace/feathr_config_registry_purview_rbac.yaml index fb88972f7..c842bc702 100644 --- a/feathr_project/test/test_user_workspace/feathr_config_registry_purview_rbac.yaml +++ b/feathr_project/test/test_user_workspace/feathr_config_registry_purview_rbac.yaml @@ -28,7 +28,7 @@ spark_config: feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" databricks: workspace_instance_url: 'https://adb-2474129336842816.16.azuredatabricks.net/' - workspace_token_value: 'dapid8ddd83000dc2863763b7d47f0e8f3db' + workspace_token_value: '' config_template: {"run_name":"FEATHR_FILL_IN","new_cluster":{"spark_version":"9.1.x-scala2.12","num_workers":1,"spark_conf":{"FEATHR_FILL_IN":"FEATHR_FILL_IN"},"instance_pool_id":"0403-214809-inlet434-pool-l9dj3kwz"},"libraries":[{"jar":"FEATHR_FILL_IN"}],"spark_jar_task":{"main_class_name":"FEATHR_FILL_IN","parameters":["FEATHR_FILL_IN"]}} work_dir: 'dbfs:/feathr_getting_started' feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" diff --git a/feathr_project/test/test_user_workspace/feathr_config_registry_sql.yaml b/feathr_project/test/test_user_workspace/feathr_config_registry_sql.yaml index 486eed1e4..dcb73d827 100644 --- a/feathr_project/test/test_user_workspace/feathr_config_registry_sql.yaml +++ b/feathr_project/test/test_user_workspace/feathr_config_registry_sql.yaml @@ -28,7 +28,7 @@ spark_config: feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" databricks: workspace_instance_url: 'https://adb-2474129336842816.16.azuredatabricks.net/' - workspace_token_value: 'dapid8ddd83000dc2863763b7d47f0e8f3db' + workspace_token_value: '' config_template: 
{"run_name":"FEATHR_FILL_IN","new_cluster":{"spark_version":"9.1.x-scala2.12","num_workers":1,"spark_conf":{"FEATHR_FILL_IN":"FEATHR_FILL_IN"},"instance_pool_id":"0403-214809-inlet434-pool-l9dj3kwz"},"libraries":[{"jar":"FEATHR_FILL_IN"}],"spark_jar_task":{"main_class_name":"FEATHR_FILL_IN","parameters":["FEATHR_FILL_IN"]}} work_dir: 'dbfs:/feathr_getting_started' feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" diff --git a/feathr_project/test/test_user_workspace/feathr_config_registry_sql_rbac.yaml b/feathr_project/test/test_user_workspace/feathr_config_registry_sql_rbac.yaml index 4ad7d35db..29c6889e8 100644 --- a/feathr_project/test/test_user_workspace/feathr_config_registry_sql_rbac.yaml +++ b/feathr_project/test/test_user_workspace/feathr_config_registry_sql_rbac.yaml @@ -28,7 +28,7 @@ spark_config: feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" databricks: workspace_instance_url: 'https://adb-2474129336842816.16.azuredatabricks.net/' - workspace_token_value: 'dapid8ddd83000dc2863763b7d47f0e8f3db' + workspace_token_value: '' config_template: {"run_name":"FEATHR_FILL_IN","new_cluster":{"spark_version":"9.1.x-scala2.12","num_workers":1,"spark_conf":{"FEATHR_FILL_IN":"FEATHR_FILL_IN"},"instance_pool_id":"0403-214809-inlet434-pool-l9dj3kwz"},"libraries":[{"jar":"FEATHR_FILL_IN"}],"spark_jar_task":{"main_class_name":"FEATHR_FILL_IN","parameters":["FEATHR_FILL_IN"]}} work_dir: 'dbfs:/feathr_getting_started' feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" From 9f446bf287387ee20effc1cb7e9b39869f7451e8 Mon Sep 17 00:00:00 2001 From: Hangfei Lin Date: Tue, 11 Oct 2022 20:35:32 -0700 Subject: [PATCH 11/68] Update product_recommendation_demo.ipynb --- docs/samples/product_recommendation_demo.ipynb | 18 +++++++++--------- 1 file changed, 9 insertions(+), 9 deletions(-) diff --git a/docs/samples/product_recommendation_demo.ipynb b/docs/samples/product_recommendation_demo.ipynb index 9ae3ee34d..44febb062 100644 --- a/docs/samples/product_recommendation_demo.ipynb +++ b/docs/samples/product_recommendation_demo.ipynb @@ -21,10 +21,10 @@ "\n", "First step is to provision required cloud resources if you want to use Feathr. Feathr provides a python based client to interact with cloud resources.\n", "\n", - "Please follow the steps [here](https://feathr-ai.github.io/feathr/how-to-guides/azure-deployment-arm.html) to provision required cloud resources. Due to the complexity of the possible cloud environment, it is almost impossible to create a script that works for all the use cases. Because of this, [azure_resource_provision.sh](https://github.com/linkedin/feathr/blob/main/docs/how-to-guides/azure_resource_provision.sh) is a full end to end command line to create all the required resources, and you can tailor the script as needed, while [the companion documentation](https://feathr-ai.github.io/feathr/how-to-guides/azure-deployment-cli.html) can be used as a complete guide for using that shell script. \n", + "Please follow the steps [here](https://feathr-ai.github.io/feathr/how-to-guides/azure-deployment-arm.html) to provision required cloud resources. Due to the complexity of the possible cloud environment, it is almost impossible to create a script that works for all the use cases. 
Because of this, [azure_resource_provision.sh](https://github.com/feathr-ai/feathr/blob/main/docs/how-to-guides/azure_resource_provision.sh) is a full end to end command line to create all the required resources, and you can tailor the script as needed, while [the companion documentation](https://feathr-ai.github.io/feathr/how-to-guides/azure-deployment-cli.html) can be used as a complete guide for using that shell script. \n", "\n", "\n", - "![Architecture](https://github.com/linkedin/feathr/blob/main/docs/images/architecture.png?raw=true)" + "![Architecture](https://github.com/feathr-ai/feathr/blob/main/docs/images/architecture.png?raw=true)" ] }, { @@ -190,7 +190,7 @@ "\n", "In the first step (Provision cloud resources), you should have provisioned all the required cloud resources. If you use Feathr CLI to create a workspace, you should have a folder with a file called `feathr_config.yaml` in it with all the required configurations. Otherwise, update the configuration below.\n", "\n", - "The code below will write this configuration string to a temporary location and load it to Feathr. Please still refer to [feathr_config.yaml](https://github.com/linkedin/feathr/blob/main/feathr_project/feathrcli/data/feathr_user_workspace/feathr_config.yaml) and use that as the source of truth. It should also have more explanations on the meaning of each variable." + "The code below will write this configuration string to a temporary location and load it to Feathr. Please still refer to [feathr_config.yaml](https://github.com/feathr-ai/feathr/blob/main/feathr_project/feathrcli/data/feathr_user_workspace/feathr_config.yaml) and use that as the source of truth. It should also have more explanations on the meaning of each variable." ] }, { @@ -201,7 +201,7 @@ "source": [ "import tempfile\n", "yaml_config = \"\"\"\n", - "# Please refer to https://github.com/linkedin/feathr/blob/main/feathr_project/feathrcli/data/feathr_user_workspace/feathr_config.yaml for explanations on the meaning of each field.\n", + "# Please refer to https://github.com/feathr-ai/feathr/blob/main/feathr_project/feathrcli/data/feathr_user_workspace/feathr_config.yaml for explanations on the meaning of each field.\n", "api_version: 1\n", "project_config:\n", " project_name: 'feathr_getting_started'\n", @@ -258,7 +258,7 @@ "source": [ "## Prerequisite: Setup necessary environment variables (Skip this step if using the above Quick Start Template)\n", "\n", - "You should setup the environment variables in order to run this sample. More environment variables can be set by referring to [feathr_config.yaml](https://github.com/linkedin/feathr/blob/main/feathr_project/feathrcli/data/feathr_user_workspace/feathr_config.yaml) and use that as the source of truth. It also has more explanations on the meaning of each variable.\n", + "You should setup the environment variables in order to run this sample. More environment variables can be set by referring to [feathr_config.yaml](https://github.com/feathr-ai/feathr/blob/main/feathr_project/feathrcli/data/feathr_user_workspace/feathr_config.yaml) and use that as the source of truth. It also has more explanations on the meaning of each variable.\n", "\n", "To run this notebook, for Azure users, you need REDIS_PASSWORD.\n", "To run this notebook, for Databricks useres, you need DATABRICKS_WORKSPACE_TOKEN_VALUE and REDIS_PASSWORD." 
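As a rough illustration of the environment setup mentioned above (all values are placeholders; the Databricks token is only needed when running against Databricks):

```python
import os

# Placeholder values - supply your own secrets before creating the FeathrClient.
os.environ['REDIS_PASSWORD'] = '<your-redis-password>'
# Databricks users also need the workspace token:
os.environ['DATABRICKS_WORKSPACE_TOKEN_VALUE'] = '<your-databricks-token>'
```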
@@ -339,7 +339,7 @@ " After a bit of data exploration, we want to create a training dataset like this:\n", "\n", " \n", - "![Feature Flow](https://github.com/linkedin/feathr/blob/main/docs/images/product_recommendation.jpg?raw=true)" + "![Feature Flow](https://github.com/feathr-ai/feathr/blob/main/docs/images/product_recommendation.jpg?raw=true)" ] }, { @@ -360,7 +360,7 @@ "1. Feature source: what source data that this feature is based on\n", "2. Transformation: what transformation is used to transform the source data into feature. Transformation can be optional when you just want to take a column out from the source data.\n", "\n", - "(For more details on feature definition, please refer to the [Feathr Feature Definition Guide](https://github.com/linkedin/feathr/blob/main/docs/concepts/feature-definition.md))" + "(For more details on feature definition, please refer to the [Feathr Feature Definition Guide](https://github.com/feathr-ai/feathr/blob/main/docs/concepts/feature-definition.md))" ] }, { @@ -569,7 +569,7 @@ "To create a training dataset using Feathr, we need to provide a feature join settings to specify\n", "what features and how these features should be joined to the observation data. \n", "\n", - "(To learn more on this topic, please refer to [Point-in-time Correctness](https://github.com/linkedin/feathr/blob/main/docs/concepts/point-in-time-join.md))" + "(To learn more on this topic, please refer to [Point-in-time Correctness](https://github.com/feathr-ai/feathr/blob/main/docs/concepts/point-in-time-join.md))" ] }, { @@ -701,7 +701,7 @@ "![img](../images/online_inference.jpg)\n", "\n", "\n", - "In this section, we will focus on materialize features to online store. For materialization to offline store, you can check out our [user guide](https://github.com/linkedin/feathr/blob/main/docs/concepts/materializing-features.md#materializing-features-to-offline-store).\n", + "In this section, we will focus on materialize features to online store. 
For materialization to offline store, you can check out our [user guide](https://github.com/feathr-ai/feathr/blob/main/docs/concepts/materializing-features.md#materializing-features-to-offline-store).\n", "\n", "We can push the computed features to the online store like below:" ] From 39c14ca77e629adf111778ae70c720084d38f5ef Mon Sep 17 00:00:00 2001 From: Enya-Yx <108409954+enya-yx@users.noreply.github.com> Date: Wed, 12 Oct 2022 23:02:44 +0800 Subject: [PATCH 12/68] Fix synapse errors not print out issue (#734) Co-authored-by: enya-yx --- feathr_project/feathr/spark_provider/_synapse_submission.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/feathr_project/feathr/spark_provider/_synapse_submission.py b/feathr_project/feathr/spark_provider/_synapse_submission.py index b72acdc42..010444715 100644 --- a/feathr_project/feathr/spark_provider/_synapse_submission.py +++ b/feathr_project/feathr/spark_provider/_synapse_submission.py @@ -325,7 +325,7 @@ def create_spark_batch_job(self, job_name, main_file, class_name=None, def get_driver_log(self, job_id) -> str: # @see: https://docs.microsoft.com/en-us/azure/synapse-analytics/spark/connect-monitor-azure-synapse-spark-application-level-metrics app_id = self.get_spark_batch_job(job_id).app_id - url = "%s/sparkhistory/api/v1/sparkpools/%s/livyid/%s/applications/%s/driverlog/stdout/?isDownload=true" % (self._synapse_dev_url, self._spark_pool_name, job_id, app_id) + url = "%s/sparkhistory/api/v1/sparkpools/%s/livyid/%s/applications/%s/driverlog/stderr/?isDownload=true" % (self._synapse_dev_url, self._spark_pool_name, job_id, app_id) token = self._credential.get_token("https://dev.azuresynapse.net/.default").token req = urllib.request.Request(url=url, headers={"authorization": "Bearer %s" % token}) resp = urllib.request.urlopen(req) From c075dc2d89a0ade329ea07e759decdd8a021d242 Mon Sep 17 00:00:00 2001 From: Jun Ki Min <42475935+loomlike@users.noreply.github.com> Date: Wed, 12 Oct 2022 10:28:03 -0700 Subject: [PATCH 13/68] Spark config passing bug fix for local spark submission (#729) * Fix local spark output file-format bug Signed-off-by: Jun Ki Min <42475935+loomlike@users.noreply.github.com> * Add dev dependencies. 
Add unit-test for local spark job launcher Signed-off-by: Jun Ki Min <42475935+loomlike@users.noreply.github.com> * Fix local spark submission unused param error Signed-off-by: Jun Ki Min <42475935+loomlike@users.noreply.github.com> Signed-off-by: Jun Ki Min <42475935+loomlike@users.noreply.github.com> --- feathr_project/feathr/client.py | 53 +++-- feathr_project/feathr/spark_provider/_abc.py | 4 +- .../spark_provider/_localspark_submission.py | 197 +++++++++--------- feathr_project/pyproject.toml | 13 +- feathr_project/setup.py | 14 +- .../test_localspark_submission.py | 51 +++++ 6 files changed, 204 insertions(+), 128 deletions(-) create mode 100644 feathr_project/test/unit/spark_provider/test_localspark_submission.py diff --git a/feathr_project/feathr/client.py b/feathr_project/feathr/client.py index 759a33365..1f77d61e0 100644 --- a/feathr_project/feathr/client.py +++ b/feathr_project/feathr/client.py @@ -1,39 +1,36 @@ import base64 +import copy import logging import os import tempfile from typing import Dict, List, Union -from feathr.definition.feature import FeatureBase -import copy -import redis from azure.identity import DefaultAzureCredential from jinja2 import Template from pyhocon import ConfigFactory -from feathr.definition.sink import Sink -from feathr.registry.feature_registry import default_registry_client - -from feathr.spark_provider._databricks_submission import _FeathrDatabricksJobLauncher -from feathr.spark_provider._synapse_submission import _FeathrSynapseJobLauncher -from feathr.spark_provider._localspark_submission import _FeathrDLocalSparkJobLauncher +import redis -from feathr.definition._materialization_utils import _to_materialization_config -from feathr.udf._preprocessing_pyudf_manager import _PreprocessingPyudfManager from feathr.constants import * -from feathr.spark_provider.feathr_configurations import SparkExecutionConfiguration +from feathr.definition._materialization_utils import _to_materialization_config +from feathr.definition.anchor import FeatureAnchor +from feathr.definition.feature import FeatureBase from feathr.definition.feature_derivations import DerivedFeature from feathr.definition.materialization_settings import MaterializationSettings from feathr.definition.monitoring_settings import MonitoringSettings -from feathr.protobuf.featureValue_pb2 import FeatureValue from feathr.definition.query_feature_list import FeatureQuery from feathr.definition.settings import ObservationSettings -from feathr.definition.feature_derivations import DerivedFeature -from feathr.definition.anchor import FeatureAnchor +from feathr.definition.sink import Sink +from feathr.protobuf.featureValue_pb2 import FeatureValue +from feathr.registry.feature_registry import default_registry_client +from feathr.spark_provider._databricks_submission import _FeathrDatabricksJobLauncher +from feathr.spark_provider._localspark_submission import _FeathrLocalSparkJobLauncher +from feathr.spark_provider._synapse_submission import _FeathrSynapseJobLauncher from feathr.spark_provider.feathr_configurations import SparkExecutionConfiguration +from feathr.udf._preprocessing_pyudf_manager import _PreprocessingPyudfManager from feathr.utils._envvariableutil import _EnvVaraibleUtil from feathr.utils._file_utils import write_to_file from feathr.utils.feature_printer import FeaturePrinter -from feathr.utils.spark_job_params import FeatureJoinJobParams, FeatureGenerationJobParams +from feathr.utils.spark_job_params import FeatureGenerationJobParams, FeatureJoinJobParams class FeathrClient(object): 
@@ -161,7 +158,7 @@ def __init__(self, config_path:str = "./feathr_config.yaml", local_workspace_dir self._FEATHR_JOB_JAR_PATH = \ self.envutils.get_environment_variable_with_default( 'spark_config', 'local', 'feathr_runtime_location') - self.feathr_spark_launcher = _FeathrDLocalSparkJobLauncher( + self.feathr_spark_launcher = _FeathrLocalSparkJobLauncher( workspace_path = self.envutils.get_environment_variable_with_default('spark_config', 'local', 'workspace'), master = self.envutils.get_environment_variable_with_default('spark_config', 'local', 'master') ) @@ -354,7 +351,7 @@ def _decode_proto(self, feature_list): else: typed_result.append(raw_feature) return typed_result - + def delete_feature_from_redis(self, feature_table, key, feature_name) -> None: """ Delete feature from Redis @@ -364,7 +361,7 @@ def delete_feature_from_redis(self, feature_table, key, feature_name) -> None: key: the key of the entity feature_name: feature name to be deleted """ - + redis_key = self._construct_redis_key(feature_table, key) if self.redis_client.hexists(redis_key, feature_name): self.redis_client.delete(redis_key, feature_name) @@ -575,20 +572,20 @@ def monitor_features(self, settings: MonitoringSettings, execution_configuration def _get_feature_key(self, feature_name: str): features = [] if 'derived_feature_list' in dir(self): - features += self.derived_feature_list + features += self.derived_feature_list if 'anchor_list' in dir(self): for anchor in self.anchor_list: - features += anchor.features + features += anchor.features for feature in features: if feature.name == feature_name: keys = feature.key - return set(key.key_column for key in keys) + return set(key.key_column for key in keys) self.logger.warning(f"Invalid feature name: {feature_name}. Please call FeathrClient.build_features() first in order to materialize the features.") return None - + # Validation on feature keys: # Features within a set of aggregation or planned to be merged should have same keys - # The param "allow_empty_key" shows if empty keys are acceptable + # The param "allow_empty_key" shows if empty keys are acceptable def _valid_materialize_keys(self, features: List[str], allow_empty_key=False): keys = None for feature in features: @@ -611,7 +608,7 @@ def _valid_materialize_keys(self, features: List[str], allow_empty_key=False): self.logger.error(f"Inconsistent feature keys. Current keys are {str(keys)}") return False return True - + def materialize_features(self, settings: MaterializationSettings, execution_configurations: Union[SparkExecutionConfiguration ,Dict[str,str]] = {}, verbose: bool = False): """Materialize feature data @@ -622,7 +619,7 @@ def materialize_features(self, settings: MaterializationSettings, execution_conf feature_list = settings.feature_names if len(feature_list) > 0 and not self._valid_materialize_keys(feature_list): raise RuntimeError(f"Invalid materialization features: {feature_list}, since they have different keys. 
Currently Feathr only supports materializing features of the same keys.") - + # Collect secrets from sinks secrets = [] for sink in settings.sinks: @@ -632,7 +629,7 @@ def materialize_features(self, settings: MaterializationSettings, execution_conf # produce materialization config for end in settings.get_backfill_cutoff_time(): settings.backfill_time.end = end - config = _to_materialization_config(settings) + config = _to_materialization_config(settings) config_file_name = "feature_gen_conf/auto_gen_config_{}.conf".format(end.timestamp()) config_file_path = os.path.join(self.local_workspace_dir, config_file_name) write_to_file(content=config, full_file_name=config_file_path) @@ -854,7 +851,7 @@ def get_features_from_registry(self, project_name: str) -> Dict[str, FeatureBase feature_dict[feature.name] = feature for feature in registry_derived_feature_list: feature_dict[feature.name] = feature - return feature_dict + return feature_dict def _reshape_config_str(self, config_str:str): if self.spark_runtime == 'local': diff --git a/feathr_project/feathr/spark_provider/_abc.py b/feathr_project/feathr/spark_provider/_abc.py index 2644f82fe..c91fdf5c1 100644 --- a/feathr_project/feathr/spark_provider/_abc.py +++ b/feathr_project/feathr/spark_provider/_abc.py @@ -1,6 +1,6 @@ from abc import ABC, abstractmethod +from typing import Dict, List, Optional, Tuple -from typing import Any, Dict, List, Optional, Tuple class SparkJobLauncher(ABC): """This is the abstract class for all the spark launchers. All the Spark launcher should implement those interfaces @@ -15,7 +15,6 @@ def upload_or_get_cloud_path(self, local_path_or_http_path: str): """ pass - @abstractmethod def submit_feathr_job(self, job_name: str, main_jar_path: str, main_class_name: str, arguments: List[str], reference_files_path: List[str], job_tags: Dict[str, str] = None, @@ -33,6 +32,7 @@ def submit_feathr_job(self, job_name: str, main_jar_path: str, main_class_name: properties (Dict[str, str]): Additional System Properties for the spark job """ pass + @abstractmethod def wait_for_completion(self, timeout_seconds: Optional[float]) -> bool: """Returns true if the job completed successfully diff --git a/feathr_project/feathr/spark_provider/_localspark_submission.py b/feathr_project/feathr/spark_provider/_localspark_submission.py index 3b24fd513..afed9683d 100644 --- a/feathr_project/feathr/spark_provider/_localspark_submission.py +++ b/feathr_project/feathr/spark_provider/_localspark_submission.py @@ -1,129 +1,125 @@ -import time from datetime import datetime import json import os from pathlib import Path -from typing import Dict, List, Optional +from shlex import split +from subprocess import STDOUT, Popen +import time +from typing import Any, Dict, List, Optional -from feathr.spark_provider._abc import SparkJobLauncher from loguru import logger - from pyspark import * -from subprocess import TimeoutExpired, STDOUT, Popen -from shlex import split from feathr.constants import FEATHR_MAVEN_ARTIFACT +from feathr.spark_provider._abc import SparkJobLauncher +class _FeathrLocalSparkJobLauncher(SparkJobLauncher): + """Class to interact with local Spark. This class is not intended to be used in Production environments. + It is intended to be used for testing and development purposes. No authentication is required to use this class. -class _FeathrDLocalSparkJobLauncher(SparkJobLauncher): - """Class to interact with local Spark - This class is not intended to be used in Production environments. 
- It is intended to be used for testing and development purposes. - No authentication is required to use this class. - Args: - workspace_path (str): Path to the workspace + Args: + workspace_path (str): Path to the workspace """ + def __init__( self, workspace_path: str, master: str = None, - debug_folder:str = "debug", - clean_up:bool = True, - retry:int = 3, - retry_sec:int = 5, + debug_folder: str = "debug", + clean_up: bool = True, + retry: int = 3, + retry_sec: int = 5, ): - """Initialize the Local Spark job launcher - """ - self.workspace_path = workspace_path, + """Initialize the Local Spark job launcher""" + self.workspace_path = (workspace_path,) self.debug_folder = debug_folder self.spark_job_num = 0 self.clean_up = clean_up self.retry = retry self.retry_sec = retry_sec self.packages = self._get_default_package() - self.master = master + self.master = master or "local[*]" def upload_or_get_cloud_path(self, local_path_or_http_path: str): """For Local Spark Case, no need to upload to cloud workspace.""" return local_path_or_http_path - def submit_feathr_job(self, job_name: str, main_jar_path: str = None, main_class_name: str = None, arguments: List[str] = None, - python_files: List[str]= None, configuration: Dict[str, str] = {}, properties: Dict[str, str] = {}, reference_files_path: List[str] = None, job_tags: Dict[str, str] = None): - """ - Submits the Feathr job to local spark, using subprocess args. - - reference files: put everything there and the function will automatically categorize them based on the - extension name to either the "files" argument in the Livy API, or the "jars" argument in the Livy API. The - path can be local path and this function will automatically upload the function to the corresponding azure - storage - - Also, note that the Spark application will automatically run on YARN cluster mode. You cannot change it if + def submit_feathr_job( + self, + job_name: str, + main_jar_path: str, + main_class_name: str, + arguments: List[str] = None, + python_files: List[str] = None, + configuration: Dict[str, str] = {}, + properties: Dict[str, str] = {}, + **_, + ) -> Any: + """Submits the Feathr job to local spark, using subprocess args. + Note that the Spark application will automatically run on YARN cluster mode. You cannot change it if you are running with Azure Synapse. 
Args: - job_name (str): name of the job - main_jar_path (str): main file paths, usually your main jar file - main_class_name (str): name of your main class - arguments (str): all the arguments you want to pass into the spark job - configuration (Dict[str, str]): Additional configs for the spark job - python_files (List[str]): required .zip, .egg, or .py files of spark job - properties (Dict[str, str]): Additional System Properties for the spark job - job_tags (str): not used in local spark mode - reference_files_path (str): not used in local spark mode + job_name: name of the job + main_jar_path: main file paths, usually your main jar file + main_class_name: name of your main class + arguments: all the arguments you want to pass into the spark job + python_files: required .zip, .egg, or .py files of spark job + configuration: Additional configs for the spark job + properties: System properties configuration + **_: Not used arguments in local spark mode, such as reference_files_path and job_tags """ - logger.warning(f"Local Spark Mode only support basic params right now and should be used only for testing purpose.") - self.cmd_file, self.log_path = self._get_debug_file_name(self.debug_folder, prefix = job_name) - args = self._init_args(master = self.master, job_name=job_name) + logger.warning( + f"Local Spark Mode only support basic params right now and should be used only for testing purpose." + ) + self.cmd_file, self.log_path = self._get_debug_file_name(self.debug_folder, prefix=job_name) - if properties: - arguments.extend(["--system-properties", json.dumps(properties)]) + # Get conf and package arguments + cfg = configuration.copy() if configuration else {} + maven_dependency = f"{cfg.pop('spark.jars.packages', self.packages)},{FEATHR_MAVEN_ARTIFACT}" + spark_args = self._init_args(job_name=job_name, confs=cfg) - if configuration: - cfg = configuration.copy() # We don't want to mess up input parameters - else: - cfg = {} - if not main_jar_path: # We don't have the main jar, use Maven - # Add Maven dependency to the job configuration - if "spark.jars.packages" in cfg: - cfg["spark.jars.packages"] = ",".join( - [cfg["spark.jars.packages"], FEATHR_MAVEN_ARTIFACT]) - else: - cfg["spark.jars.packages"] = ",".join([self.packages, FEATHR_MAVEN_ARTIFACT]) - if not python_files: # This is a JAR job # Azure Synapse/Livy doesn't allow JAR job starts from Maven directly, we must have a jar file uploaded. # so we have to use a dummy jar as the main file. 
logger.info(f"Main JAR file is not set, using default package '{FEATHR_MAVEN_ARTIFACT}' from Maven") # Use the no-op jar as the main file - # This is a dummy jar which contains only one `org.example.Noop` class with one empty `main` function which does nothing + # This is a dummy jar which contains only one `org.example.Noop` class with one empty `main` function + # which does nothing current_dir = Path(__file__).parent.resolve() main_jar_path = os.path.join(current_dir, "noop-1.0.jar") - args.extend(["--packages", cfg["spark.jars.packages"],"--class", main_class_name, main_jar_path]) + spark_args.extend(["--packages", maven_dependency, "--class", main_class_name, main_jar_path]) else: - args.extend(["--packages", cfg["spark.jars.packages"]]) - # This is a PySpark job, no more things to + spark_args.extend(["--packages", maven_dependency]) + # This is a PySpark job, no more things to if python_files.__len__() > 1: - args.extend(["--py-files", ",".join(python_files[1:])]) + spark_args.extend(["--py-files", ",".join(python_files[1:])]) print(python_files) - args.append(python_files[0]) + spark_args.append(python_files[0]) else: - args.extend(["--class", main_class_name, main_jar_path]) + spark_args.extend(["--class", main_class_name, main_jar_path]) + + if arguments: + spark_args.extend(arguments) - cmd = " ".join(args) + " " + " ".join(arguments) + if properties: + spark_args.extend(["--system-properties", json.dumps(properties)]) + + cmd = " ".join(spark_args) - log_append = open(f"{self.log_path}_{self.spark_job_num}.txt" , "a") + log_append = open(f"{self.log_path}_{self.spark_job_num}.txt", "a") proc = Popen(split(cmd), shell=False, stdout=log_append, stderr=STDOUT) logger.info(f"Detail job stdout and stderr are in {self.log_path}.") self.spark_job_num += 1 with open(self.cmd_file, "a") as c: - c.write(" ".join(proc.args)) - c.write("\n") + c.write(" ".join(proc.args)) + c.write("\n") self.latest_spark_proc = proc @@ -132,9 +128,8 @@ def submit_feathr_job(self, job_name: str, main_jar_path: str = None, main_clas return proc def wait_for_completion(self, timeout_seconds: Optional[float] = 500) -> bool: - """ - this function track local spark job commands and process status. - files will be write into `debug` folder under your workspace. + """This function track local spark job commands and process status. + Files will be write into `debug` folder under your workspace. """ logger.info(f"{self.spark_job_num} local spark job(s) in this Launcher, only the latest will be monitored.") logger.info(f"Please check auto generated spark command in {self.cmd_file} and detail logs in {self.log_path}.") @@ -143,12 +138,15 @@ def wait_for_completion(self, timeout_seconds: Optional[float] = 500) -> bool: start_time = time.time() retry = self.retry - log_read = open(f"{self.log_path}_{self.spark_job_num-1}.txt" , "r") + log_read = open(f"{self.log_path}_{self.spark_job_num-1}.txt", "r") while proc.poll() is None and (((timeout_seconds is None) or (time.time() - start_time < timeout_seconds))): time.sleep(1) try: if retry < 1: - logger.warning(f"Spark job has hang for {self.retry * self.retry_sec} seconds. latest msg is {last_line}. please check {log_read.name}") + logger.warning( + f"Spark job has hang for {self.retry * self.retry_sec} seconds. latest msg is {last_line}. 
\ + Please check {log_read.name}" + ) if self.clean_up: self._clean_up() proc.wait() @@ -168,22 +166,28 @@ def wait_for_completion(self, timeout_seconds: Optional[float] = 500) -> bool: retry -= 1 job_duration = time.time() - start_time - log_read.close() + log_read.close() if proc.returncode == None: - logger.warning(f"Spark job with pid {self.latest_spark_proc.pid} not completed after {timeout_seconds} sec time out setting, please check.") + logger.warning( + f"Spark job with pid {self.latest_spark_proc.pid} not completed after {timeout_seconds} sec \ + time out setting. Please check." + ) if self.clean_up: self._clean_up() proc.wait() return True elif proc.returncode == 1: - logger.warning(f"Spark job with pid {self.latest_spark_proc.pid} is not successful, please check.") + logger.warning(f"Spark job with pid {self.latest_spark_proc.pid} is not successful. Please check.") return False else: - logger.info(f"Spark job with pid {self.latest_spark_proc.pid} finished in: {int(job_duration)} seconds with returncode {proc.returncode}") + logger.info( + f"Spark job with pid {self.latest_spark_proc.pid} finished in: {int(job_duration)} seconds \ + with returncode {proc.returncode}" + ) return True - def _clean_up(self, proc:Popen = None): + def _clean_up(self, proc: Popen = None): logger.warning(f"Terminate the spark job due to as clean_up is set to True.") if not proc: self.latest_spark_proc.terminate() @@ -194,30 +198,35 @@ def get_status(self) -> str: """Get the status of the job, only a placeholder for local spark""" return self.latest_spark_proc.returncode - def _init_args(self, master:str, job_name:str): - if master is None: - master = "local[*]" - logger.info(f"Spark job: {job_name} is running on local spark with master: {master}.") + def _init_args(self, job_name: str, confs: Dict[str, str]) -> List[str]: + logger.info(f"Spark job: {job_name} is running on local spark with master: {self.master}.") args = [ "spark-submit", - "--master",master, - "--name",job_name, - "--conf", "spark.hadoop.fs.wasbs.impl=org.apache.hadoop.fs.azure.NativeAzureFileSystem", - "--conf", "spark.hadoop.fs.wasbs=org.apache.hadoop.fs.azure.NativeAzureFileSystem", + "--master", + self.master, + "--name", + job_name, + "--conf", + "spark.hadoop.fs.wasbs.impl=org.apache.hadoop.fs.azure.NativeAzureFileSystem", + "--conf", + "spark.hadoop.fs.wasbs=org.apache.hadoop.fs.azure.NativeAzureFileSystem", ] + + for k, v in confs.items(): + args.extend(["--conf", f"{k}={v}"]) + return args - def _get_debug_file_name(self, debug_folder: str = "debug", prefix:str = None): - """ - auto generated command will be write into cmd file - spark job output will be write into log path with job number as suffix + def _get_debug_file_name(self, debug_folder: str = "debug", prefix: str = None): + """Auto generated command will be write into cmd file. + Spark job output will be write into log path with job number as suffix. """ prefix += datetime.now().strftime("%Y%m%d%H%M%S") debug_path = os.path.join(debug_folder, prefix) print(debug_path) if not os.path.exists(debug_path): - os.makedirs(debug_path) + os.makedirs(debug_path) cmd_file = os.path.join(debug_path, f"command.sh") log_path = os.path.join(debug_path, f"log") @@ -227,7 +236,7 @@ def _get_debug_file_name(self, debug_folder: str = "debug", prefix:str = None): def _get_default_package(self): # default packages of Feathr Core, requires manual update when new dependency introduced or package updated. # TODO: automate this process, e.g. 
read from pom.xml - # TODO: dynamical modularization: add package only when it's used in the job, e.g. data source dependencies. + # TODO: dynamical modularization: add package only when it's used in the job, e.g. data source dependencies. packages = [] packages.append("org.apache.spark:spark-avro_2.12:3.3.0") packages.append("com.microsoft.sqlserver:mssql-jdbc:10.2.0.jre8") @@ -236,7 +245,7 @@ def _get_default_package(self): packages.append("com.fasterxml.jackson.core:jackson-databind:2.12.6.1") packages.append("org.apache.hadoop:hadoop-mapreduce-client-core:2.7.7") packages.append("org.apache.hadoop:hadoop-common:2.7.7") - packages.append("org.apache.hadoop:hadoop-azure:3.2.0") + packages.append("org.apache.hadoop:hadoop-azure:3.2.0") packages.append("org.apache.avro:avro:1.8.2,org.apache.xbean:xbean-asm6-shaded:4.10") packages.append("org.apache.spark:spark-sql-kafka-0-10_2.12:3.1.3") packages.append("com.microsoft.azure:azure-eventhubs-spark_2.12:2.3.21") diff --git a/feathr_project/pyproject.toml b/feathr_project/pyproject.toml index f8d897579..693233dc2 100644 --- a/feathr_project/pyproject.toml +++ b/feathr_project/pyproject.toml @@ -1,6 +1,17 @@ +[tool.black] +line-length = 120 +target_version = ['py38'] + +[tool.isort] +profile = "black" +line_length = 120 +known_first_party = ['feathr'] +force_sort_within_sections = true +multi_line_output = 3 + [build-system] requires = [ "setuptools", "wheel" ] -build-backend = "setuptools.build_meta" \ No newline at end of file +build-backend = "setuptools.build_meta" diff --git a/feathr_project/setup.py b/feathr_project/setup.py index e937f19c4..ce7ec14d6 100644 --- a/feathr_project/setup.py +++ b/feathr_project/setup.py @@ -20,7 +20,7 @@ include_package_data=True, # consider install_requires=[ - 'click<=8.1.3', + "click<=8.1.3", "py4j<=0.10.9.7", "loguru<=0.6.0", "pandas<=1.5.0", @@ -54,9 +54,17 @@ "azure-core<=1.22.1", "typing_extensions>=4.2.0" ], - tests_require=[ - 'pytest', + tests_require=[ # TODO: This has been depricated + "pytest", ], + extras_require=dict( + dev=[ + "black>=22.1.0", # formatter + "isort", # sort import statements + "pytest>=7", + "pytest-mock>=3.8.1", + ], + ), entry_points={ 'console_scripts': ['feathr=feathrcli.cli:cli'] }, diff --git a/feathr_project/test/unit/spark_provider/test_localspark_submission.py b/feathr_project/test/unit/spark_provider/test_localspark_submission.py new file mode 100644 index 000000000..9a9d7238b --- /dev/null +++ b/feathr_project/test/unit/spark_provider/test_localspark_submission.py @@ -0,0 +1,51 @@ +from typing import Dict +from unittest.mock import MagicMock + +import pytest +from pytest_mock import MockerFixture + +from feathr.spark_provider._localspark_submission import _FeathrLocalSparkJobLauncher + + +@pytest.fixture(scope="function") +def local_spark_job_launcher(tmp_path) -> _FeathrLocalSparkJobLauncher: + return _FeathrLocalSparkJobLauncher( + workspace_path=str(tmp_path), + debug_folder=str(tmp_path), + ) + + +def test__local_spark_job_launcher__submit_feathr_job( + mocker: MockerFixture, + local_spark_job_launcher: _FeathrLocalSparkJobLauncher, +): + # Mock necessary components + local_spark_job_launcher._init_args = MagicMock(return_value=[]) + mocked_proc = MagicMock() + mocked_proc.args = [] + mocked_proc.pid = 0 + + mocked_spark_proc = mocker.patch("feathr.spark_provider._localspark_submission.Popen", return_value=mocked_proc) + + local_spark_job_launcher.submit_feathr_job( + job_name="unit-test", + main_jar_path="", + main_class_name="", + ) + + # Assert if the mocked 
spark process has called once + mocked_spark_proc.assert_called_once() + + +@pytest.mark.parametrize( + "confs", [{}, {"spark.feathr.outputFormat": "parquet"}] +) +def test__local_spark_job_launcher__init_args( + local_spark_job_launcher: _FeathrLocalSparkJobLauncher, + confs: Dict[str, str], +): + spark_args = local_spark_job_launcher._init_args(job_name=None, confs=confs) + + # Assert if spark_args contains confs at the end + for k, v in confs.items(): + assert spark_args[-1] == f"{k}={v}" From d771c3c0574dc6d04a3dc969c0e93ba5283206c4 Mon Sep 17 00:00:00 2001 From: Yihui Guo Date: Thu, 13 Oct 2022 22:37:33 +0800 Subject: [PATCH 14/68] Fix direct purview client missing transformation (#736) --- .../feathr/registry/_feature_registry_purview.py | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/feathr_project/feathr/registry/_feature_registry_purview.py b/feathr_project/feathr/registry/_feature_registry_purview.py index 4ef05a690..c564e8796 100644 --- a/feathr_project/feathr/registry/_feature_registry_purview.py +++ b/feathr_project/feathr/registry/_feature_registry_purview.py @@ -1368,11 +1368,11 @@ def _get_transformation_from_dict(self, input: Dict) -> FeatureType: if 'transformExpr' in input: # it's ExpressionTransformation return ExpressionTransformation(input['transformExpr']) - elif 'def_expr' in input: - agg_expr=input['def_expr'] if 'def_expr' in input else None - agg_func=input['agg_func']if 'agg_func' in input else None + elif 'def_expr' in input or 'defExpr' in input: + agg_expr=input['def_expr'] if 'def_expr' in input else (input['defExpr'] if 'defExpr' in input else None) + agg_func=input['agg_func']if 'agg_func' in input else (input['aggFunc'] if 'aggFunc' in input else None) window=input['window']if 'window' in input else None - group_by=input['group_by']if 'group_by' in input else None + group_by=input['group_by']if 'group_by' in input else (input['groupBy'] if 'groupBy' in input else None) filter=input['filter']if 'filter' in input else None limit=input['limit']if 'limit' in input else None return WindowAggTransformation(agg_expr, agg_func, window, group_by, filter, limit) From f677a174353530dbd15835d00fe3671d1858bf77 Mon Sep 17 00:00:00 2001 From: Jinghui Mo Date: Thu, 13 Oct 2022 12:33:22 -0400 Subject: [PATCH 15/68] Revert "Derived feature bugfix (#121)" (#731) This reverts commit fa645f386002211286b5bfe3f9c72ba987be71cc. 
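For context on the template change being reverted here: the diff that follows switches the generated HOCON for derived features back to the `definition.sqlExpr` key, as the updated tests assert. A minimal Python SDK sketch of the kind of derived feature these configs are rendered from is shown below; the key, feature names, and expression are illustrative assumptions rather than part of this patch.

```python
from feathr import DerivedFeature, Feature, FLOAT, TypedKey, ValueType

# Illustrative key and anchored input feature (names are assumptions for this sketch).
user_id = TypedKey(key_column="user_id", key_column_type=ValueType.INT32)
user_embedding = Feature(name="user_embedding", key=user_id, feature_type=FLOAT)

# A derived feature like this is what the reverted template renders, emitting its
# transform expression under `definition.sqlExpr` in the feature config.
user_embedding_clean = DerivedFeature(
    name="user_embedding_clean",
    key=user_id,
    feature_type=FLOAT,
    input_features=[user_embedding],
    transform="if_else(user_embedding, user_embedding, [])",
)
```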
--- .../feathr/definition/feature_derivations.py | 2 +- feathr_project/test/test_derived_features.py | 10 +++++----- 2 files changed, 6 insertions(+), 6 deletions(-) diff --git a/feathr_project/feathr/definition/feature_derivations.py b/feathr_project/feathr/definition/feature_derivations.py index 84583654f..9205685ce 100644 --- a/feathr_project/feathr/definition/feature_derivations.py +++ b/feathr_project/feathr/definition/feature_derivations.py @@ -58,7 +58,7 @@ def to_feature_config(self) -> str: } {% endfor %} } - definition: {{derived_feature.transform.to_feature_config(False)}} + definition.sqlExpr: {{derived_feature.transform.to_feature_config(False)}} {{derived_feature.feature_type.to_feature_config()}} } """) diff --git a/feathr_project/test/test_derived_features.py b/feathr_project/test/test_derived_features.py index f879553d7..ee10cd285 100644 --- a/feathr_project/test/test_derived_features.py +++ b/feathr_project/test/test_derived_features.py @@ -26,7 +26,7 @@ def test_single_key_derived_feature_to_config(): inputs: { user_embedding: {key: [user_id], feature: user_embedding} } - definition: "if_else(user_embedding, user_embedding, [])" + definition.sqlExpr: "if_else(user_embedding, user_embedding, [])" type: { type: TENSOR tensorCategory: DENSE @@ -58,7 +58,7 @@ def test_multikey_derived_feature_to_config(): user_embedding: {key: [user_id], feature: user_embedding} item_embedding: {key: [item_id], feature: item_embedding} } - definition: "similarity(user_embedding,item_embedding)" + definition.sqlExpr: "similarity(user_embedding,item_embedding)" type: { type: TENSOR tensorCategory: DENSE @@ -88,7 +88,7 @@ def test_derived_feature_to_config_with_alias(): viewer_embedding: {key: [viewer], feature: user_embedding} viewee_embedding: {key: [viewee], feature: user_embedding} } - definition: "distance(viewer_embedding, viewee_embedding)" + definition.sqlExpr: "distance(viewer_embedding, viewee_embedding)" type: { type: TENSOR tensorCategory: DENSE @@ -129,7 +129,7 @@ def test_multi_key_derived_feature_to_config_with_alias(): viewer_viewee_distance: {key: [viewer, viewee], feature: viewer_viewee_distance} viewee_viewer_distance: {key: [viewee, viewer], feature: viewer_viewee_distance} } - definition: "viewer_viewee_distance + viewee_viewer_distance" + definition.sqlExpr: "viewer_viewee_distance + viewee_viewer_distance" type: { type: TENSOR tensorCategory: DENSE @@ -159,7 +159,7 @@ def test_derived_feature_on_multikey_anchored_feature_to_config(): inputs: { user_embedding: {key: [viewer, viewee], feature: user_embedding} } - definition: "if_else(user_embedding, user_embedding, [])" + definition.sqlExpr: "if_else(user_embedding, user_embedding, [])" type: { type: TENSOR tensorCategory: DENSE From 616d76e96ed24e45e3059de883d6aee56ff1ea20 Mon Sep 17 00:00:00 2001 From: Jinghui Mo Date: Thu, 13 Oct 2022 16:34:52 -0400 Subject: [PATCH 16/68] Support SWA with groupBy to 1d tensor conversion (#748) * Support SWA with groupby to 1d tensor conversion --- .../transformation/FDSConversionUtils.scala | 11 ++++++++--- .../offline/util/TestFDSConversionUtil.scala | 17 ++++++++++++----- 2 files changed, 20 insertions(+), 8 deletions(-) diff --git a/src/main/scala/com/linkedin/feathr/offline/transformation/FDSConversionUtils.scala b/src/main/scala/com/linkedin/feathr/offline/transformation/FDSConversionUtils.scala index 96a10a67c..25d96af11 100644 --- a/src/main/scala/com/linkedin/feathr/offline/transformation/FDSConversionUtils.scala +++ 
b/src/main/scala/com/linkedin/feathr/offline/transformation/FDSConversionUtils.scala @@ -2,14 +2,13 @@ package com.linkedin.feathr.offline.transformation import com.linkedin.feathr.common.exception.{ErrorLabel, FeathrException} import com.linkedin.feathr.common.tensor.TensorData - -import java.util import com.linkedin.feathr.common.util.CoercionUtils import com.linkedin.feathr.offline.util.FeaturizedDatasetUtils import org.apache.spark.sql.Row import org.apache.spark.sql.catalyst.expressions.GenericRowWithSchema import org.apache.spark.sql.types._ +import java.util import scala.collection.JavaConverters._ import scala.collection.convert.Wrappers.JMapWrapper import scala.collection.mutable @@ -253,7 +252,13 @@ private[offline] object FDSConversionUtils { case values: util.ArrayList[Any] => values.asScala.toArray case values: mutable.WrappedArray[Any] => - values.asInstanceOf[mutable.WrappedArray[Any]].toArray + if (values.nonEmpty && values(0).isInstanceOf[GenericRowWithSchema]) { + // Assuming the result is returned by SWA feature with groupBy, hence keeping only the + // feature value as an array and dropping the index info. + values.asInstanceOf[mutable.WrappedArray[GenericRowWithSchema]].map(v => v.get(v.size - 1)).toArray + } else { + values.toArray + } case values: List[Any] => values.toArray case mapValues: Map[Integer, Any] => diff --git a/src/test/scala/com/linkedin/feathr/offline/util/TestFDSConversionUtil.scala b/src/test/scala/com/linkedin/feathr/offline/util/TestFDSConversionUtil.scala index 3ab94e616..f3b75024e 100644 --- a/src/test/scala/com/linkedin/feathr/offline/util/TestFDSConversionUtil.scala +++ b/src/test/scala/com/linkedin/feathr/offline/util/TestFDSConversionUtil.scala @@ -3,18 +3,17 @@ package com.linkedin.feathr.offline.util import com.linkedin.feathr.common.TensorUtils import com.linkedin.feathr.common.tensor.{TensorType, Tensors} import com.linkedin.feathr.common.types.PrimitiveType - -import java.util -import java.util.Collections import com.linkedin.feathr.offline.AssertFeatureUtils import com.linkedin.feathr.offline.transformation.FDSConversionUtils import org.apache.spark.sql.Row -import org.apache.spark.sql.catalyst.expressions.GenericRow +import org.apache.spark.sql.catalyst.expressions.{GenericRow, GenericRowWithSchema} import org.apache.spark.sql.types._ import org.scalatest.testng.TestNGSuite import org.testng.Assert.{assertEquals, assertTrue} import org.testng.annotations.{DataProvider, Test} +import java.util +import java.util.Collections import scala.collection.mutable class TestFDSConversionUtil extends TestNGSuite { @@ -141,10 +140,18 @@ class TestFDSConversionUtil extends TestNGSuite { @DataProvider def dataForTestConvertRawValueTo1DFDSDenseTensorRowTz(): Array[Array[Any]] = { + val eleType = StructType( + StructField("group", IntegerType, false) :: + StructField("value", IntegerType, false) :: Nil + ) + val row1 = new GenericRowWithSchema(Array(1, 3), eleType) + val row2 = new GenericRowWithSchema(Array(2, 4), eleType) Array( Array(mutable.WrappedArray.make(Array(2.0f, 6.0f)), util.Arrays.asList(2.0f, 6.0f).toArray), Array(Array(1.1).toList, util.Arrays.asList(1.1).toArray), - Array(Map("a" -> 1.1), util.Arrays.asList(1.1).toArray) + Array(Map("a" -> 1.1), util.Arrays.asList(1.1).toArray), + // Simulate raw value return by SWA feature with groupBy + Array(mutable.WrappedArray.make(Array(row1, row2)), util.Arrays.asList(3, 4).toArray) ) } @Test(dataProvider = "dataForTestConvertRawValueTo1DFDSDenseTensorRowTz") From 
8d7d41269a376f890917d2c1cd7ac86bfdc87102 Mon Sep 17 00:00:00 2001 From: Richin Jain Date: Fri, 14 Oct 2022 15:34:45 -0700 Subject: [PATCH 17/68] Rijai/armfix (#742) * Adding DevSkim linter to Github actions * Update docker-publish.yml * Update docker-publish.yml * Update docker-publish.yml * Update docker-publish.yml * Update docker-publish.yml * Update docker-publish.yml * Update docker-publish.yml * Update docker-publish.yml * Making ARM instructions for Owner role and AAD App more clear * Removing devskim file * Reverting the changes to docker file to match with feathr/main --- docs/how-to-guides/azure-deployment-arm.md | 10 ++++++---- 1 file changed, 6 insertions(+), 4 deletions(-) diff --git a/docs/how-to-guides/azure-deployment-arm.md b/docs/how-to-guides/azure-deployment-arm.md index 0d833abf0..7bc9a926f 100644 --- a/docs/how-to-guides/azure-deployment-arm.md +++ b/docs/how-to-guides/azure-deployment-arm.md @@ -6,7 +6,7 @@ parent: How-to Guides # Azure Resource Provisioning -The provided Azure Resource Manager (ARM) template deploys the following resources, please make sure you have enough quota in the subscription and region you are deploying this in. You can view your quota and make request on Azure [portal](https://ms.portal.azure.com/#view/Microsoft_Azure_Capacity/QuotaMenuBlade/~/overview) +The provided Azure Resource Manager (ARM) template deploys the following resources, please make sure you have enough quota in the subscription and region you are deploying this in. You can view your quota and make request on Azure [portal](https://ms.portal.azure.com/#view/Microsoft_Azure_Capacity/QuotaMenuBlade/~/overview). 1. Azure Storage account 2. Azure Purview (metadata store if you selected Azure-Purview as registry backend) @@ -17,9 +17,9 @@ The provided Azure Resource Manager (ARM) template deploys the following resourc 7. Azure Event Hub 8. Azure Redis -Please note, you need to have **owner access** in the resource group you are deploying this in. Owner access is required to assign role to managed identity within ARM template so it can access key vault and store secrets. If you don't have such permission, you might want to contact your IT admin to see if they can do that. +### Please Note: you need to have the **Owner Role** in the resource group you are deploying this in. Owner access is required to assign role to managed identity within the ARM template so it can access key vault and store secrets. It is also required by the permission section in our sample notebooks. If you don't have such permission, you might want to contact your IT admin to see if they can do that. -Although we recommend end users deploy the resources using the ARM template, we understand that in many situations where users want to reuse existing resources instead of creating new resources; or users have many other permission issues. See [Manually connecting existing resources](#manually-connecting-existing-resources) for more details. +Although we recommend end users deploy the resources using the ARM template, we understand that in many situations where users want to reuse existing resources instead of creating new resources; or users may have permission issues. See [Manually connecting existing resources](#manually-connecting-existing-resources) for more details. 
## Architecture @@ -34,10 +34,12 @@ Feathr has native cloud integration and getting started with Feathr is very stra The very first step is to create an Azure Active Directory (AAD) application to enable authentication on the Feathr UI (which gets created as part of the deployment script). Currently it is not possible to create one through ARM template but you can easily create one by running the following CLI commands in the [Cloud Shell](https://shell.azure.com/bash). +### Please make note of the Client ID and Tenant ID for the AAD app, you will need it in the ARM template deployment section. + ```bash # This is the prefix you want to name your resources with, make a note of it, you will need it during deployment. # Note: please keep the `resourcePrefix` short (less than 15 chars), since some of the Azure resources need the full name to be less than 24 characters. Only lowercase alphanumeric characters are allowed for resource prefix. -resource_prefix="userprefix1" +resource_prefix="yourprefix" # Please don't change this name, a corresponding webapp with same name gets created in subsequent steps. sitename="${resource_prefix}webapp" From 4bdcd574fde47ff3072a83b507d92a3fe612de49 Mon Sep 17 00:00:00 2001 From: Yuqing Wei Date: Sat, 15 Oct 2022 06:52:43 +0800 Subject: [PATCH 18/68] bump version to 0.8.2 (#722) Signed-off-by: Yuqing Wei Signed-off-by: Yuqing Wei --- build.sbt | 2 +- docs/how-to-guides/azure_resource_provision.json | 2 +- feathr_project/feathr/constants.py | 2 +- feathr_project/setup.py | 2 +- feathr_project/test/test_user_workspace/feathr_config.yaml | 4 ++-- .../test_user_workspace/feathr_config_registry_purview.yaml | 4 ++-- .../feathr_config_registry_purview_rbac.yaml | 4 ++-- .../test/test_user_workspace/feathr_config_registry_sql.yaml | 4 ++-- .../test_user_workspace/feathr_config_registry_sql_rbac.yaml | 4 ++-- 9 files changed, 14 insertions(+), 14 deletions(-) diff --git a/build.sbt b/build.sbt index 2919ddae6..d85f99016 100644 --- a/build.sbt +++ b/build.sbt @@ -2,7 +2,7 @@ import sbt.Keys.publishLocalConfiguration ThisBuild / resolvers += Resolver.mavenLocal ThisBuild / scalaVersion := "2.12.15" -ThisBuild / version := "0.8.0" +ThisBuild / version := "0.8.2" ThisBuild / organization := "com.linkedin.feathr" ThisBuild / organizationName := "linkedin" val sparkVersion = "3.1.3" diff --git a/docs/how-to-guides/azure_resource_provision.json b/docs/how-to-guides/azure_resource_provision.json index 03d175052..6ab77a419 100644 --- a/docs/how-to-guides/azure_resource_provision.json +++ b/docs/how-to-guides/azure_resource_provision.json @@ -111,7 +111,7 @@ "destinationBacpacBlobUrl": "[concat('https://',variables('dlsName'),'.blob.core.windows.net/',variables('dlsFsName'),'/',variables('bacpacBlobName'))]", "bacpacDeploymentScriptName": "CopyBacpacFile", "bacpacDbExtensionName": "registryRbacDbImport", - "preBuiltdockerImage": "feathrfeaturestore/feathr-registry:releases-v0.8.0" + "preBuiltdockerImage": "feathrfeaturestore/feathr-registry:releases-v0.8.2" }, "functions": [], "resources": [ diff --git a/feathr_project/feathr/constants.py b/feathr_project/feathr/constants.py index 6686f14ac..c4cbad7ff 100644 --- a/feathr_project/feathr/constants.py +++ b/feathr_project/feathr/constants.py @@ -28,7 +28,7 @@ TYPEDEF_ARRAY_DERIVED_FEATURE=f"array" TYPEDEF_ARRAY_ANCHOR_FEATURE=f"array" -FEATHR_MAVEN_ARTIFACT="com.linkedin.feathr:feathr_2.12:0.8.0" +FEATHR_MAVEN_ARTIFACT="com.linkedin.feathr:feathr_2.12:0.8.2" JOIN_CLASS_NAME="com.linkedin.feathr.offline.job.FeatureJoinJob" 
GEN_CLASS_NAME="com.linkedin.feathr.offline.job.FeatureGenJob" \ No newline at end of file diff --git a/feathr_project/setup.py b/feathr_project/setup.py index ce7ec14d6..7c3e10178 100644 --- a/feathr_project/setup.py +++ b/feathr_project/setup.py @@ -7,7 +7,7 @@ setup( name='feathr', - version='0.8.0', + version='0.8.2', long_description=long_description, long_description_content_type="text/markdown", author_email="feathr-technical-discuss@lists.lfaidata.foundation", diff --git a/feathr_project/test/test_user_workspace/feathr_config.yaml b/feathr_project/test/test_user_workspace/feathr_config.yaml index e67c803ef..b0f2b259c 100644 --- a/feathr_project/test/test_user_workspace/feathr_config.yaml +++ b/feathr_project/test/test_user_workspace/feathr_config.yaml @@ -82,7 +82,7 @@ spark_config: # Feathr Job configuration. Support local paths, path start with http(s)://, and paths start with abfs(s):// # this is the default location so end users don't have to compile the runtime again. # feathr_runtime_location: wasbs://public@azurefeathrstorage.blob.core.windows.net/feathr-assembly-LATEST.jar - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" databricks: # workspace instance workspace_instance_url: 'https://adb-2474129336842816.16.azuredatabricks.net/' @@ -93,7 +93,7 @@ spark_config: # Feathr Job location. Support local paths, path start with http(s)://, and paths start with dbfs:/ work_dir: 'dbfs:/feathr_getting_started' # this is the default location so end users don't have to compile the runtime again. - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" online_store: redis: diff --git a/feathr_project/test/test_user_workspace/feathr_config_registry_purview.yaml b/feathr_project/test/test_user_workspace/feathr_config_registry_purview.yaml index f716da0b4..003e424eb 100644 --- a/feathr_project/test/test_user_workspace/feathr_config_registry_purview.yaml +++ b/feathr_project/test/test_user_workspace/feathr_config_registry_purview.yaml @@ -25,13 +25,13 @@ spark_config: workspace_dir: 'abfss://feathrazuretest3fs@feathrazuretest3storage.dfs.core.windows.net/feathr_test_workspace' executor_size: 'Small' executor_num: 1 - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" databricks: workspace_instance_url: 'https://adb-2474129336842816.16.azuredatabricks.net/' workspace_token_value: '' config_template: {"run_name":"FEATHR_FILL_IN","new_cluster":{"spark_version":"9.1.x-scala2.12","num_workers":1,"spark_conf":{"FEATHR_FILL_IN":"FEATHR_FILL_IN"},"instance_pool_id":"0403-214809-inlet434-pool-l9dj3kwz"},"libraries":[{"jar":"FEATHR_FILL_IN"}],"spark_jar_task":{"main_class_name":"FEATHR_FILL_IN","parameters":["FEATHR_FILL_IN"]}} work_dir: 'dbfs:/feathr_getting_started' - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" online_store: redis: diff --git a/feathr_project/test/test_user_workspace/feathr_config_registry_purview_rbac.yaml b/feathr_project/test/test_user_workspace/feathr_config_registry_purview_rbac.yaml index c842bc702..0722a34d8 100644 --- a/feathr_project/test/test_user_workspace/feathr_config_registry_purview_rbac.yaml +++ 
b/feathr_project/test/test_user_workspace/feathr_config_registry_purview_rbac.yaml @@ -25,13 +25,13 @@ spark_config: workspace_dir: 'abfss://feathrazuretest3fs@feathrazuretest3storage.dfs.core.windows.net/feathr_test_workspace' executor_size: 'Small' executor_num: 1 - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" databricks: workspace_instance_url: 'https://adb-2474129336842816.16.azuredatabricks.net/' workspace_token_value: '' config_template: {"run_name":"FEATHR_FILL_IN","new_cluster":{"spark_version":"9.1.x-scala2.12","num_workers":1,"spark_conf":{"FEATHR_FILL_IN":"FEATHR_FILL_IN"},"instance_pool_id":"0403-214809-inlet434-pool-l9dj3kwz"},"libraries":[{"jar":"FEATHR_FILL_IN"}],"spark_jar_task":{"main_class_name":"FEATHR_FILL_IN","parameters":["FEATHR_FILL_IN"]}} work_dir: 'dbfs:/feathr_getting_started' - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" online_store: redis: diff --git a/feathr_project/test/test_user_workspace/feathr_config_registry_sql.yaml b/feathr_project/test/test_user_workspace/feathr_config_registry_sql.yaml index dcb73d827..507b096cb 100644 --- a/feathr_project/test/test_user_workspace/feathr_config_registry_sql.yaml +++ b/feathr_project/test/test_user_workspace/feathr_config_registry_sql.yaml @@ -25,13 +25,13 @@ spark_config: workspace_dir: 'abfss://feathrazuretest3fs@feathrazuretest3storage.dfs.core.windows.net/feathr_test_workspace' executor_size: 'Small' executor_num: 1 - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" databricks: workspace_instance_url: 'https://adb-2474129336842816.16.azuredatabricks.net/' workspace_token_value: '' config_template: {"run_name":"FEATHR_FILL_IN","new_cluster":{"spark_version":"9.1.x-scala2.12","num_workers":1,"spark_conf":{"FEATHR_FILL_IN":"FEATHR_FILL_IN"},"instance_pool_id":"0403-214809-inlet434-pool-l9dj3kwz"},"libraries":[{"jar":"FEATHR_FILL_IN"}],"spark_jar_task":{"main_class_name":"FEATHR_FILL_IN","parameters":["FEATHR_FILL_IN"]}} work_dir: 'dbfs:/feathr_getting_started' - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" online_store: redis: diff --git a/feathr_project/test/test_user_workspace/feathr_config_registry_sql_rbac.yaml b/feathr_project/test/test_user_workspace/feathr_config_registry_sql_rbac.yaml index 29c6889e8..9403cb190 100644 --- a/feathr_project/test/test_user_workspace/feathr_config_registry_sql_rbac.yaml +++ b/feathr_project/test/test_user_workspace/feathr_config_registry_sql_rbac.yaml @@ -25,13 +25,13 @@ spark_config: workspace_dir: 'abfss://feathrazuretest3fs@feathrazuretest3storage.dfs.core.windows.net/feathr_test_workspace' executor_size: 'Small' executor_num: 1 - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" databricks: workspace_instance_url: 'https://adb-2474129336842816.16.azuredatabricks.net/' workspace_token_value: '' config_template: 
{"run_name":"FEATHR_FILL_IN","new_cluster":{"spark_version":"9.1.x-scala2.12","num_workers":1,"spark_conf":{"FEATHR_FILL_IN":"FEATHR_FILL_IN"},"instance_pool_id":"0403-214809-inlet434-pool-l9dj3kwz"},"libraries":[{"jar":"FEATHR_FILL_IN"}],"spark_jar_task":{"main_class_name":"FEATHR_FILL_IN","parameters":["FEATHR_FILL_IN"]}} work_dir: 'dbfs:/feathr_getting_started' - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" online_store: redis: From 3c407c3aec9f3f435f177854a664b49de5d167ff Mon Sep 17 00:00:00 2001 From: Chang Yong Lik <51813538+ahlag@users.noreply.github.com> Date: Sat, 15 Oct 2022 08:17:42 +0900 Subject: [PATCH 19/68] Added latest deltalake version (#735) * Added latest deltalake version * Changed == to <= for deltalake installation * Changed <= to >= --- feathr_project/setup.py | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/feathr_project/setup.py b/feathr_project/setup.py index 7c3e10178..47d105061 100644 --- a/feathr_project/setup.py +++ b/feathr_project/setup.py @@ -35,8 +35,7 @@ "pyarrow<=9.0.0", "pyspark>=3.1.2", "python-snappy<=0.6.1", - # fixing https://github.com/feathr-ai/feathr/issues/687 - "deltalake<=0.5.8", + "deltalake>=0.6.2", "graphlib_backport<=1.0.3", "protobuf==3.*", "confluent-kafka<=1.9.2", From 1465f6472094da5e710c832c3d4691e694644d50 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E5=BE=90=E8=BE=B0?= Date: Sat, 15 Oct 2022 13:15:57 +0800 Subject: [PATCH 20/68] #474 Disable local mode (#738) --- .../com/linkedin/feathr/offline/util/SourceUtils.scala | 6 +----- 1 file changed, 1 insertion(+), 5 deletions(-) diff --git a/src/main/scala/com/linkedin/feathr/offline/util/SourceUtils.scala b/src/main/scala/com/linkedin/feathr/offline/util/SourceUtils.scala index e9d3a2bf1..a70c11fd0 100644 --- a/src/main/scala/com/linkedin/feathr/offline/util/SourceUtils.scala +++ b/src/main/scala/com/linkedin/feathr/offline/util/SourceUtils.scala @@ -652,11 +652,7 @@ private[offline] object SourceUtils { ss.read.format("csv").option("header", "true").option("delimiter", csvDelimiterOption).load(inputData.inputPath) } case _ => { - if (ss.sparkContext.isLocal){ - getLocalDF(ss, inputData.inputPath, dataLoaderHandlers) - } else { - loadAsDataFrame(ss, SimplePath(inputData.inputPath),dataLoaderHandlers) - } + loadAsDataFrame(ss, SimplePath(inputData.inputPath),dataLoaderHandlers) } } } From d59ea4bdad6606683470883e686a56262c5f10b3 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E5=BE=90=E8=BE=B0?= Date: Sat, 15 Oct 2022 13:40:58 +0800 Subject: [PATCH 21/68] Allow recreating entities for PurView registry (#691) * Allow recreating entities for PurView registry * Use constants --- .../registry/_feature_registry_purview.py | 46 ++++++++++++++++ .../registry/purview_registry.py | 54 +++++++++++++++---- 2 files changed, 91 insertions(+), 9 deletions(-) diff --git a/feathr_project/feathr/registry/_feature_registry_purview.py b/feathr_project/feathr/registry/_feature_registry_purview.py index c564e8796..a6b2c17e4 100644 --- a/feathr_project/feathr/registry/_feature_registry_purview.py +++ b/feathr_project/feathr/registry/_feature_registry_purview.py @@ -3,6 +3,7 @@ import inspect import itertools import os +import re import sys import ast import types @@ -44,6 +45,25 @@ from feathr.constants import * +def _to_snake(d, level: int = 0): + """ + Convert `string`, `list[string]`, or all keys in a `dict` into snake case + The maximum length of input string or list is 100, or it will 
be truncated before being processed, for dict, the exception will be thrown if it has more than 100 keys. + the maximum nested level is 10, otherwise the exception will be thrown + """ + if level >= 10: + raise ValueError("Too many nested levels") + if isinstance(d, str): + d = d[:100] + return re.sub(r'(?<!^)(?=[A-Z])', '_', d).lower() + if isinstance(d, list): + d = d[:100] + return [_to_snake(i, level + 1) if isinstance(i, (dict, list)) else i for i in d] + if isinstance(d, dict): + if len(d) > 100: + raise ValueError("Dict has too many keys") + return {_to_snake(a, level + 1): _to_snake(b, level + 1) if isinstance(b, (dict, list)) else b for a, b in d.items()} + + class _PurviewRegistry(FeathrRegistry): """ Initializes the feature registry, doing the following: @@ -720,6 +740,32 @@ def upload_single_entity_to_purview(self,entity:Union[AtlasEntity,AtlasProcess]) The entity itself will also be modified, fill the GUID with real GUID in Purview. In order to avoid having concurrency issue, and provide clear guidance, this method only allows entity uploading once at a time. ''' + try: + """ + Try to find existing entity/process first, if found, return the existing entity's GUID + """ + id = self.get_entity_id(entity.qualifiedName) + response = self.purview_client.get_entity(id)['entities'][0] + j = entity.to_json() + if j["typeName"] == response["typeName"]: + if j["typeName"] == "Process": + if response["attributes"]["qualifiedName"] != j["attributes"]["qualifiedName"]: + raise RuntimeError("The requested entity %s conflicts with the existing entity in PurView" % j["attributes"]["qualifiedName"]) + else: + if "type" in response['attributes'] and response["typeName"] in (TYPEDEF_ANCHOR_FEATURE, TYPEDEF_DERIVED_FEATURE): + conf = ConfigFactory.parse_string(response['attributes']['type']) + response['attributes']['type'] = dict(conf) + keys = set([_to_snake(key) for key in j["attributes"].keys()]) - set(["qualified_name"]) + keys.add("qualifiedName") + for k in keys: + if response["attributes"][k] != j["attributes"][k]: + raise RuntimeError("The requested entity %s conflicts with the existing entity in PurView" % j["attributes"]["qualifiedName"]) + return response["guid"] + else: + raise RuntimeError("The requested entity %s conflicts with the existing entity in PurView" % j["attributes"]["qualifiedName"]) + except AtlasException as e: + pass + try: entity.lastModifiedTS="0" result = self.purview_client.upload_entities([entity]) diff --git a/registry/purview-registry/registry/purview_registry.py b/registry/purview-registry/registry/purview_registry.py index 9f5f47560..15a650167 100644 --- a/registry/purview-registry/registry/purview_registry.py +++ b/registry/purview-registry/registry/purview_registry.py @@ -5,6 +5,9 @@ from urllib.error import HTTPError from uuid import UUID +from registry.models import to_snake +from pyapacheatlas.core.util import AtlasException + from azure.identity import DefaultAzureCredential from loguru import logger from pyapacheatlas.auth.azcredential import AzCredentialWrapper @@ -20,6 +23,9 @@ Label_BelongsTo = "BELONGSTO" Label_Consumes = "CONSUMES" Label_Produces = "PRODUCES" +TYPEDEF_DERIVED_FEATURE="feathr_derived_feature_v1" +TYPEDEF_ANCHOR_FEATURE="feathr_anchor_feature_v1" + TYPEDEF_ARRAY_ANCHOR=f"array" TYPEDEF_ARRAY_DERIVED_FEATURE=f"array" TYPEDEF_ARRAY_ANCHOR_FEATURE=f"array" @@ -568,17 +574,47 @@ def _register_feathr_feature_types(self): def _upload_entity_batch(self, entity_batch:list[AtlasEntity]): # we only support entity creation, update is not supported. # setting lastModifiedTS ==0 will ensure this, if another entity with ts>=1 exist - # upload funtion will fail with 412 Precondition fail. 
+ # upload function will fail with 412 Precondition fail. for entity in entity_batch: - entity.lastModifiedTS="0" - results = self.purview_client.upload_entities( - batch=entity) - if results: - dict = {x.guid: x for x in entity_batch} - for k, v in results['guidAssignments'].items(): - dict[k].guid = v + self._upload_single_entity(entity) + + def _upload_single_entity(self, entity:AtlasEntity): + try: + """ + Try to find existing entity/process first, if found, return the existing entity's GUID + """ + id = self.get_entity_id(entity.qualifiedName) + response = self.purview_client.get_entity(id)['entities'][0] + j = entity.to_json() + if j["typeName"] == response["typeName"]: + if j["typeName"] == "Process": + if response["attributes"]["qualifiedName"] != j["attributes"]["qualifiedName"]: + raise RuntimeError("The requested entity %s conflicts with the existing entity in PurView" % j["attributes"]["qualifiedName"]) + else: + if "type" in response['attributes'] and response["typeName"] in (TYPEDEF_ANCHOR_FEATURE, TYPEDEF_DERIVED_FEATURE): + conf = ConfigFactory.parse_string(response['attributes']['type']) + response['attributes']['type'] = dict(conf) + keys = set([to_snake(key) for key in j["attributes"].keys()]) - set(["qualified_name"]) + keys.add("qualifiedName") + for k in keys: + if response["attributes"][k] != j["attributes"][k]: + raise RuntimeError("The requested entity %s conflicts with the existing entity in PurView" % j["attributes"]["qualifiedName"]) + entity.guid = response["guid"] + return else: - raise RuntimeError("Feature registration failed.", results) + raise RuntimeError("The requested entity %s conflicts with the existing entity in PurView" % j["attributes"]["qualifiedName"]) + except AtlasException as e: + pass + + entity.lastModifiedTS="0" + results = self.purview_client.upload_entities( + batch=entity) + if results: + d = {x.guid: x for x in [entity]} + for k, v in results['guidAssignments'].items(): + d[k].guid = v + else: + raise RuntimeError("Feature registration failed.", results) def _generate_fully_qualified_name(self, segments): return self.registry_delimiter.join(segments) From b6cff14ecbf77a147a53653056e9efdd3f1fb6a9 Mon Sep 17 00:00:00 2001 From: Richin Jain Date: Sun, 16 Oct 2022 19:24:52 -0700 Subject: [PATCH 22/68] Adding DevSkim linter to Github actions (#657) * Adding DevSkim linter to Github actions * Ignoring .git and test folder --- .github/workflows/devskim-security-linter.yml | 37 +++++++++++++++++++ 1 file changed, 37 insertions(+) create mode 100644 .github/workflows/devskim-security-linter.yml diff --git a/.github/workflows/devskim-security-linter.yml b/.github/workflows/devskim-security-linter.yml new file mode 100644 index 000000000..e7e33b7ab --- /dev/null +++ b/.github/workflows/devskim-security-linter.yml @@ -0,0 +1,37 @@ +# This workflow uses actions that are not certified by GitHub. +# They are provided by a third-party (Microsoft) and are governed by +# separate terms of service, privacy policy, and support +# documentation. 
+# For more details about Devskim, visit https://github.com/marketplace/actions/devskim + +name: DevSkim + +on: + push: + branches: [ "main" ] + pull_request: + branches: [ "main" ] + schedule: + - cron: '00 4 * * *' + +jobs: + lint: + name: DevSkim + runs-on: ubuntu-20.04 + permissions: + actions: read + contents: read + security-events: write + steps: + - name: Checkout code + uses: actions/checkout@v3 + + - name: Run DevSkim scanner + uses: microsoft/DevSkim-Action@v1 + with: + ignore-globs: "**/.git/**,**/test/**" + + - name: Upload DevSkim scan results to GitHub Security tab + uses: github/codeql-action/upload-sarif@v2 + with: + sarif_file: devskim-results.sarif From 3d12944e952bf3dd40bb7ee56f40b32fd31f14d8 Mon Sep 17 00:00:00 2001 From: Boli Guan Date: Mon, 17 Oct 2022 16:26:29 +0800 Subject: [PATCH 23/68] Fix icons in UI cannot auto scale (#737) (#744) * Fix icons in UI cannot auto scale (#737) * Fix home.css code style issue --- ui/.vscode/settings.json | 9 +- ui/src/pages/home/home.css | 23 ++++ ui/src/pages/home/home.tsx | 210 +++++++++++-------------------------- 3 files changed, 93 insertions(+), 149 deletions(-) create mode 100644 ui/src/pages/home/home.css diff --git a/ui/.vscode/settings.json b/ui/.vscode/settings.json index 24fe97ae7..c8e624dc0 100644 --- a/ui/.vscode/settings.json +++ b/ui/.vscode/settings.json @@ -4,5 +4,12 @@ }, "editor.defaultFormatter": "esbenp.prettier-vscode", "editor.formatOnSave": true, - "eslint.workingDirectories": [{ "mode": "auto" }] + "eslint.workingDirectories": [ + { + "mode": "auto" + } + ], + "[css]": { + "editor.defaultFormatter": "esbenp.prettier-vscode" + } } diff --git a/ui/src/pages/home/home.css b/ui/src/pages/home/home.css new file mode 100644 index 000000000..5c4a3b8a8 --- /dev/null +++ b/ui/src/pages/home/home.css @@ -0,0 +1,23 @@ +.home .ant-card { + box-shadow: 5px 8px 15px 5px rgba(208, 216, 243, 0.6); + border-radius: 8px; +} + +.home .card-meta { + display: flex; +} + +.home .card-meta .ant-card-meta-avatar { + max-width: 80px; + flex-basis: 30%; + box-sizing: border-box; +} + +.home .card-meta .ant-card-meta-avatar > span { + width: 100%; +} + +.home .card-meta .ant-card-meta-avatar svg { + width: 100%; + height: auto; +} diff --git a/ui/src/pages/home/home.tsx b/ui/src/pages/home/home.tsx index 240ab8901..88732ffeb 100644 --- a/ui/src/pages/home/home.tsx +++ b/ui/src/pages/home/home.tsx @@ -8,17 +8,42 @@ import { ProjectOutlined, } from "@ant-design/icons"; +import "./home.css"; + const { Title } = Typography; +const { Meta } = Card; + +const features = [ + { + icon: , + title: "Projects", + link: "/projects", + linkText: "See all", + }, + { + icon: , + title: "Sources", + link: "/dataSources", + linkText: "See all", + }, + { + icon: , + title: "Features", + link: "/features", + linkText: "See all", + }, + { + icon: , + title: "Monitoring", + link: "/monitoring", + linkText: "See all", + }, +]; const Home = () => { return ( -
- +
+ Welcome to Feathr Feature Store You can use Feathr UI to search features, identify data sources, track @@ -33,141 +58,36 @@ const Home = () => { - - - - - - + {features.map((item) => { + return ( + + + + {item.title} + + } + description={{item.linkText}} /> - - - - - Projects - - - - - - See all - - - - - - - - - - - - - - - - - Sources - - - - - - See all - - - - - - - - - - - - - - - - - Features - - - - - - See all - - - - - - - - - - - - - - - - - Monitoring - - - - - - See all - - - - - - - + + + ); + })} - - - + + + Need help to get started? Explore the following resources to get started with Feathr:
    @@ -237,14 +157,8 @@ const Home = () => {

    - - + + Recent Activity Under construction From 3070a863d69f767658ca4adc819f6a3aac71ea18 Mon Sep 17 00:00:00 2001 From: Enya-Yx <108409954+enya-yx@users.noreply.github.com> Date: Mon, 17 Oct 2022 16:30:25 +0800 Subject: [PATCH 24/68] Expose 'timePartitionPattern' in Python API [ WIP ] (#714) * Expose 'timePartitionPattern' * add test case * Add test cases and docstring * delete local files * quick fix Co-authored-by: enya-yx Co-authored-by: enya-yx --- feathr_project/feathr/definition/source.py | 21 ++++++- .../spark_provider/_synapse_submission.py | 2 + feathr_project/test/test_azure_spark_e2e.py | 36 +++++++++++- feathr_project/test/test_feature_anchor.py | 58 ++++++++++++++++++- feathr_project/test/test_fixture.py | 28 +++++++++ 5 files changed, 142 insertions(+), 3 deletions(-) diff --git a/feathr_project/feathr/definition/source.py b/feathr_project/feathr/definition/source.py index b9721a1a5..3ca8925df 100644 --- a/feathr_project/feathr/definition/source.py +++ b/feathr_project/feathr/definition/source.py @@ -100,14 +100,30 @@ class HdfsSource(Source): - `epoch` (seconds since epoch), for example `1647737463` - `epoch_millis` (milliseconds since epoch), for example `1647737517761` - Any date formats supported by [SimpleDateFormat](https://docs.oracle.com/javase/8/docs/api/java/text/SimpleDateFormat.html). + registry_tags: A dict of (str, str) that you can pass to feature registry for better organization. For example, you can use {"deprecated": "true"} to indicate this source is deprecated, etc. + time_partition_pattern(Optional[str]): Format of the time partitioned feature data. e.g. yyyy/MM/DD. All formats supported in dateTimeFormatter. + config: + timeSnapshotHdfsSource: + { + location: + { + path: "/data/somePath/daily" + } + timePartitionPattern: "yyyy/MM/dd" + } + Given the above HDFS path: /data/somePath/daily, + then the expectation is that the following sub directorie(s) should exist: + /data/somePath/daily/{yyyy}/{MM}/{dd} + """ - def __init__(self, name: str, path: str, preprocessing: Optional[Callable] = None, event_timestamp_column: Optional[str] = None, timestamp_format: Optional[str] = "epoch", registry_tags: Optional[Dict[str, str]] = None) -> None: + def __init__(self, name: str, path: str, preprocessing: Optional[Callable] = None, event_timestamp_column: Optional[str] = None, timestamp_format: Optional[str] = "epoch", registry_tags: Optional[Dict[str, str]] = None, time_partition_pattern: Optional[str] = None) -> None: super().__init__(name, event_timestamp_column, timestamp_format, registry_tags=registry_tags) self.path = path self.preprocessing = preprocessing + self.time_partition_pattern = time_partition_pattern if path.startswith("http"): logger.warning( "Your input path {} starts with http, which is not supported. 
Consider using paths starting with wasb[s]/abfs[s]/s3.", path) @@ -116,6 +132,9 @@ def to_feature_config(self) -> str: tm = Template(""" {{source.name}}: { location: {path: "{{source.path}}"} + {% if source.time_partition_pattern %} + timePartitionPattern: "{{source.time_partition_pattern}}" + {% endif %} {% if source.event_timestamp_column %} timeWindowParameters: { timestampColumn: "{{source.event_timestamp_column}}" diff --git a/feathr_project/feathr/spark_provider/_synapse_submission.py b/feathr_project/feathr/spark_provider/_synapse_submission.py index 010444715..5b55a3b06 100644 --- a/feathr_project/feathr/spark_provider/_synapse_submission.py +++ b/feathr_project/feathr/spark_provider/_synapse_submission.py @@ -432,6 +432,8 @@ def download_file(self, target_adls_directory: str, local_dir_cache: str): # returns the paths to all the files in the target director in ADLS # get all the paths that are not under a directory + test_paths = self.file_system_client.get_paths( + path=parse_result.path, recursive=False) result_paths = [basename(file_path.name) for file_path in self.file_system_client.get_paths( path=parse_result.path, recursive=False) if not file_path.is_directory] diff --git a/feathr_project/test/test_azure_spark_e2e.py b/feathr_project/test/test_azure_spark_e2e.py index d2aa0b032..9e452d2d0 100644 --- a/feathr_project/test/test_azure_spark_e2e.py +++ b/feathr_project/test/test_azure_spark_e2e.py @@ -20,7 +20,7 @@ from feathr import ValueType from feathr.utils.job_utils import get_result_df from feathrcli.cli import init -from test_fixture import (basic_test_setup, get_online_test_table_name) +from test_fixture import (basic_test_setup, get_online_test_table_name, time_partition_pattern_test_setup) from test_utils.constants import Constants # make sure you have run the upload feature script before running these tests @@ -58,6 +58,40 @@ def test_feathr_materialize_to_offline(): res_df = get_result_df(client, "avro", output_path + "/df0/daily/2020/05/20") assert res_df.shape[0] > 0 +def test_feathr_materialize_with_time_partition_pattern(): + """ + Test FeathrClient() using HdfsSource with 'timePartitionPattern'. 
+ """ + test_workspace_dir = Path( + __file__).parent.resolve() / "test_user_workspace" + # os.chdir(test_workspace_dir) + + client: FeathrClient = time_partition_pattern_test_setup(os.path.join(test_workspace_dir, "feathr_config.yaml")) + + backfill_time = BackfillTime(start=datetime( + 2020, 5, 20), end=datetime(2020, 5, 20), step=timedelta(days=1)) + + now = datetime.now() + if client.spark_runtime == 'databricks': + output_path = ''.join(['dbfs:/feathrazure_cijob_materialize_offline_','_', str(now.minute), '_', str(now.second), ""]) + else: + output_path = ''.join(['abfss://feathrazuretest3fs@feathrazuretest3storage.dfs.core.windows.net/demo_data/feathrazure_cijob_materialize_offline_','_', str(now.minute), '_', str(now.second), ""]) + offline_sink = HdfsSink(output_path=output_path) + settings = MaterializationSettings("nycTaxiTable", + sinks=[offline_sink], + feature_names=[ + "f_location_avg_fare", "f_location_max_fare"], + backfill_time=backfill_time) + client.materialize_features(settings) + # assuming the job can successfully run; otherwise it will throw exception + client.wait_job_to_finish(timeout_sec=Constants.SPARK_JOB_TIMEOUT_SECONDS) + + # download result and just assert the returned result is not empty + # by default, it will write to a folder appended with date + res_df = get_result_df(client, "avro", output_path + "/df0/daily/2020/05/20") + assert res_df.shape[0] > 0 + + def test_feathr_online_store_agg_features(): """ Test FeathrClient() get_online_features and batch_get can get data correctly. diff --git a/feathr_project/test/test_feature_anchor.py b/feathr_project/test/test_feature_anchor.py index d5e6701b8..1fabeec67 100644 --- a/feathr_project/test/test_feature_anchor.py +++ b/feathr_project/test/test_feature_anchor.py @@ -167,4 +167,60 @@ def test_agg_anchor_to_config(): } } """ - assert ''.join(agg_anchor.to_feature_config().split()) == ''.join(expected_agg_feature_config.split()) \ No newline at end of file + assert ''.join(agg_anchor.to_feature_config().split()) == ''.join(expected_agg_feature_config.split()) + +def test_time_partition_to_config(): + batch_source = HdfsSource(name="testTimePartitionSource", + path="abfss://public@azurefeathrstorage.blob.core.windows.net/sample_data/time_partition_pattern", + time_partition_pattern="yyyy/MM/dd" + ) + key = TypedKey(key_column="key0", + key_column_type=ValueType.INT32) + agg_features = [ + Feature(name="f_loc_avg", + key=[key], + feature_type=FLOAT, + transform="f_location_avg_fare"), + Feature(name="f_loc_max", + feature_type=FLOAT, + key=[key], + transform="f_location_max_fare"), + ] + agg_anchor = FeatureAnchor(name="testTimePartitionFeaturesSource", + source=batch_source, + features=agg_features) + expected_time_partition_config = """ + anchors: { + testTimePartitionFeatures: { + source: testTimePartitionSource + key.sqlExpr: [key0] + features: { + f_loc_avg: { + def.sqlExpr: "f_location_avg_fare" + type: { + type: TENSOR + tensorCategory: DENSE + dimensionType: [] + valType: FLOAT + } + } + f_loc_max: { + def.sqlExpr: "f_location_max_fare" + type: { + type: TENSOR + tensorCategory: DENSE + dimensionType: [] + valType: FLOAT + } + } + } + } + } + sources: { + testTimePartitionSource: { + location: {path: "abfss://public@azurefeathrstorage.blob.core.windows.net/sample_data/time_partition_pattern"} + timePartitionPattern: "yyyy/MM/dd" + } + } + """ + assert ''.join(agg_anchor.to_feature_config().split()) == ''.join(expected_time_partition_config.split()) \ No newline at end of file diff --git 
a/feathr_project/test/test_fixture.py b/feathr_project/test/test_fixture.py index c048eff7c..637e74202 100644 --- a/feathr_project/test/test_fixture.py +++ b/feathr_project/test/test_fixture.py @@ -88,6 +88,34 @@ def basic_test_setup(config_path: str): return client +def time_partition_pattern_test_setup(config_path: str): + now = datetime.now() + # set workspace folder by time; make sure we don't have write conflict if there are many CI tests running + os.environ['SPARK_CONFIG__DATABRICKS__WORK_DIR'] = ''.join(['dbfs:/feathrazure_cijob','_', str(now.minute), '_', str(now.second), '_', str(now.microsecond)]) + os.environ['SPARK_CONFIG__AZURE_SYNAPSE__WORKSPACE_DIR'] = ''.join(['abfss://feathrazuretest3fs@feathrazuretest3storage.dfs.core.windows.net/feathr_github_ci','_', str(now.minute), '_', str(now.second) ,'_', str(now.microsecond)]) + client = FeathrClient(config_path=config_path) + batch_source = HdfsSource(name="testTimePartitionSource", + path="wasbs://public@azurefeathrstorage.blob.core.windows.net/sample_data/time_partition_pattern/daily", + time_partition_pattern="yyyy/MM/dd" + ) + key = TypedKey(key_column="key0", + key_column_type=ValueType.INT32) + agg_features = [ + Feature(name="f_loc_avg", + key=[key], + feature_type=FLOAT, + transform="f_location_avg_fare"), + Feature(name="f_loc_max", + feature_type=FLOAT, + key=[key], + transform="f_location_max_fare"), + ] + + agg_anchor = FeatureAnchor(name="testTimePartitionFeatures", + source=batch_source, + features=agg_features) + client.build_features(anchor_list=[agg_anchor]) + return client def snowflake_test_setup(config_path: str): now = datetime.now() From 83b79c9f894b734ff0596bfcbb343d430a904338 Mon Sep 17 00:00:00 2001 From: Richin Jain Date: Mon, 17 Oct 2022 01:32:25 -0700 Subject: [PATCH 25/68] Setting up component governance pipeline (#655) [skip ci] --- azure-pipelines.yml | 15 +++++++++++++++ 1 file changed, 15 insertions(+) create mode 100644 azure-pipelines.yml diff --git a/azure-pipelines.yml b/azure-pipelines.yml new file mode 100644 index 000000000..e5808aff2 --- /dev/null +++ b/azure-pipelines.yml @@ -0,0 +1,15 @@ +# Component Governance Pipeline +# Runs the Feathr code through Component Governance Detection tool and publishes the result under compliance tab. + +trigger: +- main + +pool: + vmImage: ubuntu-latest + +steps: +- task: ComponentGovernanceComponentDetection@0 + inputs: + scanType: 'Register' + verbosity: 'Verbose' + alertWarningLevel: 'High' \ No newline at end of file From b03689862857f6bae9bea7b8d148b4349bd8b6d6 Mon Sep 17 00:00:00 2001 From: Xiaoyong Zhu Date: Mon, 17 Oct 2022 18:41:46 -0700 Subject: [PATCH 26/68] Add docs to explain on feature materialization behavior (#688) * Update materializing-features.md * Update materializing-features.md --- docs/concepts/materializing-features.md | 50 +++++++++++++++++++++++++ 1 file changed, 50 insertions(+) diff --git a/docs/concepts/materializing-features.md b/docs/concepts/materializing-features.md index eacf980ff..3c31124e2 100644 --- a/docs/concepts/materializing-features.md +++ b/docs/concepts/materializing-features.md @@ -161,3 +161,53 @@ More reference on the APIs: - [MaterializationSettings API](https://feathr.readthedocs.io/en/latest/feathr.html#feathr.MaterializationSettings) - [HdfsSink API](https://feathr.readthedocs.io/en/latest/feathr.html#feathr.HdfsSource) + +## Expected behavior on Feature Materialization + +When end users materialize features to a sink, what is the expected behavior? 
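Before diving into the explanation, it may help to ground the question in a concrete call. The following is a minimal sketch using the materialization API exercised by the tests earlier in this series; the config file path, job name, sink table, and feature names are illustrative assumptions, not a prescribed setup.

```python
from datetime import datetime, timedelta

from feathr import BackfillTime, FeathrClient, MaterializationSettings, RedisSink

# Assumes a valid feathr_config.yaml exists; all names below are illustrative.
client = FeathrClient(config_path="./feathr_config.yaml")

# Materialize two aggregated features, keyed by location, into an online store.
backfill_time = BackfillTime(start=datetime(2020, 5, 20), end=datetime(2020, 5, 20), step=timedelta(days=1))
settings = MaterializationSettings(
    "nycTaxiTable",
    sinks=[RedisSink(table_name="nycTaxiDemoFeature")],
    feature_names=["f_location_avg_fare", "f_location_max_fare"],
    backfill_time=backfill_time,
)
client.materialize_features(settings)
```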
+ +It seems to be a straightforward question, but actually it is not. Basically when end users want to materialize a feature, Feathr is expecting that: For a certain entity key (say a user_id), there will be multiple features (say user_total_gift_card_balance, and user_purchase_in_last_week). So two checks will be performed: + +1. Those features should have the same entity key (say a user_id). You cannot materialize features for two entity keys in the same materialization job (although you can do it in different jobs), for example materializing `user_total_purchase` and `product_sold_in_last_week` in the same Feathr materialization job. +2. Those features should all be "aggregated" features. I.e. each of them should be a feature which has a type of `WindowAggTransformation`, such as `product_sold_in_last_week`, or `user_latest_total_gift_card_balance`. + +The first constraint is pretty straightforward to explain: when Feathr materializes certain features, they are used to describe certain aspects of a given entity, such as a user. Describing `product_sold_in_last_week` would not make sense for users. + +The second constraint is a bit more interesting. For example, you have defined `user_total_gift_card_balance` and it has different values for the same user across different times, say the corresponding values are 40,30,20,20 for the last 4 days, like below. +Original data: + +| UserId | user_total_gift_card_balance | Date | +| ------ | ---------------------------- | ---------- | +| 1 | 40 | 2022/01/01 | +| 1 | 30 | 2022/01/02 | +| 1 | 20 | 2022/01/03 | +| 1 | 20 | 2022/01/04 | +| 2 | 40 | 2022/01/01 | +| 2 | 30 | 2022/01/02 | +| 2 | 20 | 2022/01/03 | +| 2 | 20 | 2022/01/04 | +| 3 | 40 | 2022/01/01 | +| 3 | 30 | 2022/01/02 | +| 3 | 20 | 2022/01/03 | +| 3 | 20 | 2022/01/04 | + +However, the materialized features have no dates associated with them. I.e. the materialized result should be something like this: + +| UserId | user_total_gift_card_balance | +| ------ | ---------------------------- | +| 1 | ? | +| 2 | ? | +| 3 | ? | + +When you ask Feathr to "materialize" `user_total_gift_card_balance` for you, there's only one value that can be materialized, since the materialized feature does not have a date associated with it. So the problem is - for a given `user_id`, only one `user_total_gift_card_balance` can be its feature. Which value do you choose out of the 4 values? A random value? The latest value? + +It might be natural to think that "we should materialize the latest feature", and that behavior, by definition, is an "aggregation" operation, since we have 4 values for a given `user_id` but we are only materializing and using one of them. In that case, Feathr asks you to explicitly say that you want to materialize the latest feature (i.e. 
by using [Point-in-time Join](./point-in-time-join.md)) + +```python +feature = Feature(name="user_total_gift_card_balance", + key=UserId, + feature_type=FLOAT, + transform=WindowAggTransformation(agg_expr="gift_card_balance", + agg_func="LATEST", + window="7d")) +``` \ No newline at end of file From 5030eee7979973b979045773d0c7c0f429ac937d Mon Sep 17 00:00:00 2001 From: Enya-Yx <108409954+enya-yx@users.noreply.github.com> Date: Tue, 18 Oct 2022 15:08:39 +0800 Subject: [PATCH 27/68] Fix protobuf version (#711) * Fix protobuf version * quick fix Co-authored-by: enya-yx --- feathr_project/setup.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/feathr_project/setup.py b/feathr_project/setup.py index 47d105061..f36ba18b0 100644 --- a/feathr_project/setup.py +++ b/feathr_project/setup.py @@ -37,7 +37,7 @@ "python-snappy<=0.6.1", "deltalake>=0.6.2", "graphlib_backport<=1.0.3", - "protobuf==3.*", + "protobuf<=3.19.4,>=3.0.0", "confluent-kafka<=1.9.2", "databricks-cli<=0.17.3", "avro<=1.11.1", From aad580dc580364664a3eefac3321523213313934 Mon Sep 17 00:00:00 2001 From: Enya-Yx <108409954+enya-yx@users.noreply.github.com> Date: Tue, 18 Oct 2022 22:45:15 +0800 Subject: [PATCH 28/68] Add some notes based on on-call issues (#753) * Add some notes based on on-call issues * quick fix Co-authored-by: enya-yx --- docs/concepts/feature-registry.md | 2 ++ docs/how-to-guides/feathr-configuration-and-env.md | 2 +- 2 files changed, 3 insertions(+), 1 deletion(-) diff --git a/docs/concepts/feature-registry.md b/docs/concepts/feature-registry.md index 9bc00b275..112fa1c4b 100644 --- a/docs/concepts/feature-registry.md +++ b/docs/concepts/feature-registry.md @@ -74,6 +74,8 @@ client.register_features() all_features = client.list_registered_features(project_name=client.project_name) ``` +Please avoid applying a same name to different features under a certain project. Since it will be treated as updating an exsiting project which is not supported by feathr and will cause errors. + ### Reuse Features from Existing Registry The feature producers can just let the feature consumers know which features exist so the feature consumers can reuse them. For feature consumers, they can reuse existing features from the registry. The whole project can be retrieved to local environment by calling this API `client.get_features_from_registry` with a project name. This encourage feature reuse across organizations. For example, end users of a feature just need to read all feature definitions from the existing projects, then use a few features from the projects and join those features with a new dataset you have. diff --git a/docs/how-to-guides/feathr-configuration-and-env.md b/docs/how-to-guides/feathr-configuration-and-env.md index e4d393a43..e5c6b761a 100644 --- a/docs/how-to-guides/feathr-configuration-and-env.md +++ b/docs/how-to-guides/feathr-configuration-and-env.md @@ -64,7 +64,7 @@ Feathr will get the configurations in the following order: | SPARK_CONFIG__SPARK_RESULT_OUTPUT_PARTS | Configure number of parts for the spark output for feature generation job | Required | | SPARK_CONFIG__AZURE_SYNAPSE__DEV_URL | Dev URL to the synapse cluster. Usually it's something like `https://yourclustername.dev.azuresynapse.net` | Required if using Azure Synapse | | SPARK_CONFIG__AZURE_SYNAPSE__POOL_NAME | name of the spark pool that you are going to use | Required if using Azure Synapse | -| SPARK_CONFIG__AZURE_SYNAPSE__WORKSPACE_DIR | A location that Synapse has access to. 
This workspace dir stores all the required configuration files and the jar resources. All the feature definitions will be uploaded here | Required if using Azure Synapse | +| SPARK_CONFIG__AZURE_SYNAPSE__WORKSPACE_DIR | A location that Synapse has access to. This workspace dir stores all the required configuration files and the jar resources. All the feature definitions will be uploaded here. Suggest to use an empty dir for a new spark job to avoid conflicts. | Required if using Azure Synapse | | SPARK_CONFIG__AZURE_SYNAPSE__EXECUTOR_SIZE | Specifies the executor size for the Azure Synapse cluster. Currently the options are `Small`, `Medium`, `Large`. | Required if using Azure Synapse | | SPARK_CONFIG__AZURE_SYNAPSE__EXECUTOR_NUM | Specifies the number of executors for the Azure Synapse cluster | Required if using Azure Synapse | | SPARK_CONFIG__AZURE_SYNAPSE__FEATHR_RUNTIME_LOCATION | Specifies the Feathr runtime location. Support local paths, path start with `http(s)://`, and paths start with `abfss:/`. If not set, will use the [Feathr package published in Maven](https://search.maven.org/artifact/com.linkedin.feathr/feathr_2.12). | Required if using Azure Synapse | From 4b9b4940bf3e8a40d9fc720a8af297a9ea8adafc Mon Sep 17 00:00:00 2001 From: Yuqing Wei Date: Wed, 19 Oct 2022 13:28:50 +0800 Subject: [PATCH 29/68] Refine spark runtime error message (#755) Signed-off-by: Yuqing Wei --- feathr_project/feathr/client.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/feathr_project/feathr/client.py b/feathr_project/feathr/client.py index 1f77d61e0..b21c15549 100644 --- a/feathr_project/feathr/client.py +++ b/feathr_project/feathr/client.py @@ -111,7 +111,7 @@ def __init__(self, config_path:str = "./feathr_config.yaml", local_workspace_dir self.credential = credential if self.spark_runtime not in {'azure_synapse', 'databricks', 'local'}: raise RuntimeError( - 'Only \'azure_synapse\' and \'databricks\' are currently supported.') + f'{self.spark_runtime} is not supported. Only \'azure_synapse\', \'databricks\' and \'local\' are currently supported.') elif self.spark_runtime == 'azure_synapse': # Feathr is a spark-based application so the feathr jar compiled from source code will be used in the # Spark job submission. The feathr jar hosted in cloud saves the time users needed to upload the jar from From b8e3b27189a969744d636d0be8945559430ab2ef Mon Sep 17 00:00:00 2001 From: Richin Jain Date: Tue, 18 Oct 2022 22:58:46 -0700 Subject: [PATCH 30/68] Serialization bug due to version incompatibility between azure-core and msrest (#763) * Adding DevSkim linter to Github actions * Fix in ARM template to pull latest tagged release image from dockerhub * Removing dev skim file from this branch * Fixing linkedin org reference * Removing the docker index url from dockerhub image name as it seems to cause problem with the update * Adding to the right file, had a dockerhub workflow file with different name * Adding debug statements to test udf issue on Synapse * Adding more print statements * Pinning msrest version to work with pinned version of azure-core * Removing debug code from previous branch --- feathr_project/setup.py | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/feathr_project/setup.py b/feathr_project/setup.py index f36ba18b0..7ecd24ecb 100644 --- a/feathr_project/setup.py +++ b/feathr_project/setup.py @@ -51,6 +51,10 @@ # https://github.com/Azure/azure-sdk-for-python/pull/22891 # using a version lower than that to workaround this issue. 
"azure-core<=1.22.1", + # azure-core 1.22.1 is dependent on msrest==0.6.21, if an environment(AML) has a different version of azure-core (say 1.24.0), + # it brings a different version of msrest(0.7.0) which is incompatible with azure-core==1.22.1. Hence we need to pin it. + # See this for more details: https://github.com/Azure/azure-sdk-for-python/issues/24765 + "msrest<=0.6.21", "typing_extensions>=4.2.0" ], tests_require=[ # TODO: This has been depricated From fa10e721c44c6aeb2e8679614dbf28b1c033b8d7 Mon Sep 17 00:00:00 2001 From: Yuqing Wei Date: Wed, 19 Oct 2022 18:49:30 +0800 Subject: [PATCH 31/68] Unify Python SDK Build Version and decouple Feathr Maven Version (#746) * unify python package version and enable env setting for scala version Signed-off-by: Yuqing Wei * update docs and decouple maven version Signed-off-by: Yuqing Wei * change version back to 0.8.0 to avoid conflicts Signed-off-by: Yuqing Wei * fix typo Signed-off-by: Yuqing Wei Signed-off-by: Yuqing Wei --- docs/dev_guide/feathr_overall_release_guide.md | 6 +++--- feathr_project/feathr/__init__.py | 7 ++----- feathr_project/feathr/constants.py | 6 +++++- feathr_project/feathr/version.py | 1 + feathr_project/setup.py | 14 +++++++++++++- 5 files changed, 24 insertions(+), 10 deletions(-) create mode 100644 feathr_project/feathr/version.py diff --git a/docs/dev_guide/feathr_overall_release_guide.md b/docs/dev_guide/feathr_overall_release_guide.md index 069f6edf4..0174c8dae 100644 --- a/docs/dev_guide/feathr_overall_release_guide.md +++ b/docs/dev_guide/feathr_overall_release_guide.md @@ -31,11 +31,11 @@ Read through the [commit log](https://github.com/feathr-ai/feathr/commits/main) ## Code Changes Before the release is made, the version needs to be updated in following places - [build.sbt](https://github.com/feathr-ai/feathr/blob/main/build.sbt#L3) - For Maven release version -- [setup.py](https://github.com/feathr-ai/feathr/blob/main/feathr_project/setup.py#L10) - For PyPi release version +- [version.py](https://github.com/feathr-ai/feathr/blob/main/feathr_project/feathr/version.py#L1) - For Feathr version - [conf.py](https://github.com/feathr-ai/feathr/blob/main/feathr_project/docs/conf.py#L27) - For documentation version -- [feathr_config.yaml](https://github.com/feathr-ai/feathr/blob/main/feathr_project/test/test_user_workspace/feathr_config.yaml#L84) - To set the spark runtime location for Azure Synapse and Azure Databricks used by test suite. -- [constants.py](https://github.com/feathr-ai/feathr/blob/73656fe4a57219e99ff6fede10d51a000ae90fa1/feathr_project/feathr/constants.py#L31) - To set the default maven artifact version +- [feathr_config.yaml](https://github.com/feathr-ai/feathr/blob/main/feathr_project/test/test_user_workspace/feathr_config.yaml#L84) - To set the spark runtime location for Azure Synapse and Azure Databricks used by test suite. Please update all .yaml files under this path. - [azure_resource_provision.json](https://github.com/feathr-ai/feathr/blob/main/docs/how-to-guides/azure_resource_provision.json#L114) - To set the deployment template to pull the latest release image. +- [constants.py](https://github.com/feathr-ai/feathr/blob/main/feathr_project/feathr/constants.py#L31) - To set the default maven artifact version (Only needed when maven version is **NOT** the same as python sdk version) ## Triggering automated release pipelines Our goal is to automate the release process as much as possible. 
So far, we have automated the following steps diff --git a/feathr_project/feathr/__init__.py b/feathr_project/feathr/__init__.py index 9b0cf0a49..74809fd81 100644 --- a/feathr_project/feathr/__init__.py +++ b/feathr_project/feathr/__init__.py @@ -1,5 +1,3 @@ -import pkg_resources - from .client import FeathrClient from .spark_provider.feathr_configurations import SparkExecutionConfiguration from .definition.feature_derivations import * @@ -19,6 +17,7 @@ from .definition.settings import * from .utils.job_utils import * from .utils.feature_printer import * +from .version import __version__ # skipped class as they are internal methods: # RepoDefinitions, HoconConvertible, @@ -75,7 +74,5 @@ 'ObservationSettings', 'FeaturePrinter', 'SparkExecutionConfiguration', + __version__, ] - - -__version__ = pkg_resources.require("feathr")[0].version diff --git a/feathr_project/feathr/constants.py b/feathr_project/feathr/constants.py index c4cbad7ff..b2222e2b6 100644 --- a/feathr_project/feathr/constants.py +++ b/feathr_project/feathr/constants.py @@ -28,7 +28,11 @@ TYPEDEF_ARRAY_DERIVED_FEATURE=f"array" TYPEDEF_ARRAY_ANCHOR_FEATURE=f"array" -FEATHR_MAVEN_ARTIFACT="com.linkedin.feathr:feathr_2.12:0.8.2" +# Decouple Feathr MAVEN Version from Feathr Python SDK Version +import os +from feathr.version import __version__ +FEATHR_MAVEN_VERSION = os.environ.get("FEATHR_MAVEN_VERSION", __version__) +FEATHR_MAVEN_ARTIFACT=f"com.linkedin.feathr:feathr_2.12:{FEATHR_MAVEN_VERSION}" JOIN_CLASS_NAME="com.linkedin.feathr.offline.job.FeatureJoinJob" GEN_CLASS_NAME="com.linkedin.feathr.offline.job.FeatureGenJob" \ No newline at end of file diff --git a/feathr_project/feathr/version.py b/feathr_project/feathr/version.py new file mode 100644 index 000000000..807119de6 --- /dev/null +++ b/feathr_project/feathr/version.py @@ -0,0 +1 @@ +__version__ = "0.8.0" \ No newline at end of file diff --git a/feathr_project/setup.py b/feathr_project/setup.py index 7ecd24ecb..4f766b4ec 100644 --- a/feathr_project/setup.py +++ b/feathr_project/setup.py @@ -1,3 +1,5 @@ +import sys +import os from setuptools import setup, find_packages from pathlib import Path @@ -5,9 +7,19 @@ root_path = Path(__file__).resolve().parent.parent long_description = (root_path / "docs/README.md").read_text(encoding="utf8") +try: + exec(open("feathr/version.py").read()) +except IOError: + print("Failed to load Feathr version file for packaging.", + file=sys.stderr) + sys.exit(-1) + +VERSION = __version__ # noqa +os.environ["FEATHR_VERSION"] = VERSION + setup( name='feathr', - version='0.8.2', + version=VERSION, long_description=long_description, long_description_content_type="text/markdown", author_email="feathr-technical-discuss@lists.lfaidata.foundation", From c0e8bc8ae017d7003210ad96e755f8abb4781543 Mon Sep 17 00:00:00 2001 From: Yuqing Wei Date: Wed, 19 Oct 2022 18:50:39 +0800 Subject: [PATCH 32/68] replace hard code string in notebook and align with others (#765) Signed-off-by: Yuqing Wei Signed-off-by: Yuqing Wei --- docs/samples/product_recommendation_demo_advanced.ipynb | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/docs/samples/product_recommendation_demo_advanced.ipynb b/docs/samples/product_recommendation_demo_advanced.ipynb index e4c5917a5..b03dccac6 100644 --- a/docs/samples/product_recommendation_demo_advanced.ipynb +++ b/docs/samples/product_recommendation_demo_advanced.ipynb @@ -116,7 +116,7 @@ }, "outputs": [], "source": [ - "resource_prefix = \"ckim2\"" + "resource_prefix = \"feathr_resource_prefix\"" ] }, { @@ 
-1214,7 +1214,7 @@ "widgets": {} }, "kernelspec": { - "display_name": "Python 3.9.5 ('base')", + "display_name": "Python 3.9.13 64-bit ('3.9.13')", "language": "python", "name": "python3" }, @@ -1228,11 +1228,11 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.9.5" + "version": "3.9.13" }, "vscode": { "interpreter": { - "hash": "3d597f4c481aa0f25dceb95d2a0067e73c0966dcbd003d741d821a7208527ecf" + "hash": "c5d1b88564ea095927319e95d120a01ba9530a1c584720276480e541fd6461c7" } } }, From 143ff898b6c61666289981948f000012fda822d1 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E5=BE=90=E8=BE=B0?= Date: Thu, 20 Oct 2022 18:39:37 +0800 Subject: [PATCH 33/68] Add flag to enable generation non-agg features (#719) * Add flag to enable generation non-agg features * Typo * Resolve comments --- feathr_project/feathr/client.py | 19 +++++++++- .../test/test_azure_snowflake_e2e.py | 2 +- feathr_project/test/test_azure_spark_e2e.py | 2 +- .../test/test_azure_spark_maven_e2e.py | 37 ++++++++++++++++++- .../test/test_feature_materialization.py | 2 +- .../test/test_pyduf_preprocessing_e2e.py | 2 +- 6 files changed, 56 insertions(+), 8 deletions(-) diff --git a/feathr_project/feathr/client.py b/feathr_project/feathr/client.py index b21c15549..b14bf868e 100644 --- a/feathr_project/feathr/client.py +++ b/feathr_project/feathr/client.py @@ -6,6 +6,7 @@ from typing import Dict, List, Union from azure.identity import DefaultAzureCredential +from feathr.definition.transformation import WindowAggTransformation from jinja2 import Template from pyhocon import ConfigFactory import redis @@ -608,17 +609,31 @@ def _valid_materialize_keys(self, features: List[str], allow_empty_key=False): self.logger.error(f"Inconsistent feature keys. Current keys are {str(keys)}") return False return True - - def materialize_features(self, settings: MaterializationSettings, execution_configurations: Union[SparkExecutionConfiguration ,Dict[str,str]] = {}, verbose: bool = False): + + def materialize_features(self, settings: MaterializationSettings, execution_configurations: Union[SparkExecutionConfiguration ,Dict[str,str]] = {}, verbose: bool = False, allow_materialize_non_agg_feature: bool = False): """Materialize feature data Args: settings: Feature materialization settings execution_configurations: a dict that will be passed to spark job when the job starts up, i.e. the "spark configurations". Note that not all of the configuration will be honored since some of the configurations are managed by the Spark platform, such as Databricks or Azure Synapse. Refer to the [spark documentation](https://spark.apache.org/docs/latest/configuration.html) for a complete list of spark configurations. + allow_materialize_non_agg_feature: Materializing non-aggregated features (the features without WindowAggTransformation) doesn't output meaningful results so it's by default set to False, but if you really want to materialize non-aggregated features, set this to True. """ feature_list = settings.feature_names if len(feature_list) > 0 and not self._valid_materialize_keys(feature_list): raise RuntimeError(f"Invalid materialization features: {feature_list}, since they have different keys. 
Currently Feathr only supports materializing features of the same keys.") + + if not allow_materialize_non_agg_feature: + # Check if there are non-aggregation features in the list + for fn in feature_list: + # Check over anchor features + for anchor in self.anchor_list: + for feature in anchor.features: + if feature.name == fn and not isinstance(feature.transform, WindowAggTransformation): + raise RuntimeError(f"Feature {fn} is not an aggregation feature. Currently Feathr only supports materializing aggregation features. If you want to materialize {fn}, please set allow_materialize_non_agg_feature to True.") + # Check over derived features + for feature in self.derived_feature_list: + if feature.name == fn and not isinstance(feature.transform, WindowAggTransformation): + raise RuntimeError(f"Feature {fn} is not an aggregation feature. Currently Feathr only supports materializing aggregation features. If you want to materialize {fn}, please set allow_materialize_non_agg_feature to True.") # Collect secrets from sinks secrets = [] diff --git a/feathr_project/test/test_azure_snowflake_e2e.py b/feathr_project/test/test_azure_snowflake_e2e.py index c84aa9153..17474ab1b 100644 --- a/feathr_project/test/test_azure_snowflake_e2e.py +++ b/feathr_project/test/test_azure_snowflake_e2e.py @@ -30,7 +30,7 @@ def test_feathr_online_store_agg_features(): feature_names=['f_snowflake_call_center_division_name', 'f_snowflake_call_center_zipcode'], backfill_time=backfill_time) - client.materialize_features(settings) + client.materialize_features(settings, allow_materialize_non_agg_feature=True) # just assume the job is successful without validating the actual result in Redis. Might need to consolidate # this part with the test_feathr_online_store test case client.wait_job_to_finish(timeout_sec=Constants.SPARK_JOB_TIMEOUT_SECONDS) diff --git a/feathr_project/test/test_azure_spark_e2e.py b/feathr_project/test/test_azure_spark_e2e.py index 9e452d2d0..e82e0efe9 100644 --- a/feathr_project/test/test_azure_spark_e2e.py +++ b/feathr_project/test/test_azure_spark_e2e.py @@ -153,7 +153,7 @@ def test_feathr_online_store_non_agg_features(): feature_names=["f_gen_trip_distance", "f_gen_is_long_trip_distance", "f1", "f2", "f3", "f4", "f5", "f6"], backfill_time=backfill_time) - client.materialize_features(settings) + client.materialize_features(settings, allow_materialize_non_agg_feature=True) # just assume the job is successful without validating the actual result in Redis. 
Might need to consolidate # this part with the test_feathr_online_store test case client.wait_job_to_finish(timeout_sec=Constants.SPARK_JOB_TIMEOUT_SECONDS) diff --git a/feathr_project/test/test_azure_spark_maven_e2e.py b/feathr_project/test/test_azure_spark_maven_e2e.py index b8e7cefb0..6b93bb7a8 100644 --- a/feathr_project/test/test_azure_spark_maven_e2e.py +++ b/feathr_project/test/test_azure_spark_maven_e2e.py @@ -3,8 +3,12 @@ from pathlib import Path from feathr import (BackfillTime, MaterializationSettings) -from feathr import RedisSink +# from feathr import * from feathr.client import FeathrClient +from feathr.definition.dtype import ValueType +from feathr.definition.query_feature_list import FeatureQuery +from feathr.definition.settings import ObservationSettings +from feathr.definition.typed_key import TypedKey from test_fixture import (basic_test_setup, get_online_test_table_name) from test_utils.constants import Constants @@ -22,6 +26,35 @@ def test_feathr_online_store_agg_features(): # Maven package as the dependency and `noop.jar` as the main file client: FeathrClient = basic_test_setup(os.path.join(test_workspace_dir, "feathr_config_maven.yaml")) + + + location_id = TypedKey(key_column="DOLocationID", + key_column_type=ValueType.INT32, + description="location id in NYC", + full_name="nyc_taxi.location_id") + + feature_query = FeatureQuery( + feature_list=["f_location_avg_fare"], key=location_id) + settings = ObservationSettings( + observation_path="wasbs://public@azurefeathrstorage.blob.core.windows.net/sample_data/green_tripdata_2020-04.csv", + event_timestamp_column="lpep_dropoff_datetime", + timestamp_format="yyyy-MM-dd HH:mm:ss") + + now = datetime.now() + # set output folder based on different runtime + if client.spark_runtime == 'databricks': + output_path = ''.join(['dbfs:/feathrazure_cijob','_', str(now.minute), '_', str(now.second), ".avro"]) + else: + output_path = ''.join(['abfss://xchfeathrtest4fs@xchfeathrtest4sto.dfs.core.windows.net/demo_data/output','_', str(now.minute), '_', str(now.second), ".avro"]) + + + client.get_offline_features(observation_settings=settings, + feature_query=feature_query, + output_path=output_path) + + # assuming the job can successfully run; otherwise it will throw exception + client.wait_job_to_finish(timeout_sec=Constants.SPARK_JOB_TIMEOUT_SECONDS) + return backfill_time = BackfillTime(start=datetime( 2020, 5, 20), end=datetime(2020, 5, 20), step=timedelta(days=1)) redisSink = RedisSink(table_name=online_test_table) @@ -51,4 +84,4 @@ def test_feathr_online_store_agg_features(): assert res['239'][0] != None assert res['239'][1] != None assert res['265'][0] != None - assert res['265'][1] != None \ No newline at end of file + assert res['265'][1] != None diff --git a/feathr_project/test/test_feature_materialization.py b/feathr_project/test/test_feature_materialization.py index edd9bb537..e8100578c 100644 --- a/feathr_project/test/test_feature_materialization.py +++ b/feathr_project/test/test_feature_materialization.py @@ -236,7 +236,7 @@ def test_delete_feature_from_redis(): "f_day_of_week" ], backfill_time=backfill_time) - client.materialize_features(settings) + client.materialize_features(settings, allow_materialize_non_agg_feature=True) client.wait_job_to_finish(timeout_sec=Constants.SPARK_JOB_TIMEOUT_SECONDS) diff --git a/feathr_project/test/test_pyduf_preprocessing_e2e.py b/feathr_project/test/test_pyduf_preprocessing_e2e.py index 9ac9c1917..83ace12ea 100644 --- a/feathr_project/test/test_pyduf_preprocessing_e2e.py +++ 
b/feathr_project/test/test_pyduf_preprocessing_e2e.py @@ -103,7 +103,7 @@ def test_non_swa_feature_gen_with_offline_preprocessing(): "f_day_of_week" ], backfill_time=backfill_time) - client.materialize_features(settings) + client.materialize_features(settings, allow_materialize_non_agg_feature=True) # just assume the job is successful without validating the actual result in Redis. Might need to consolidate # this part with the test_feathr_online_store test case client.wait_job_to_finish(timeout_sec=Constants.SPARK_JOB_TIMEOUT_SECONDS) From 59e4ccf0d7a902a96faf592921620de5486769d6 Mon Sep 17 00:00:00 2001 From: Yuqing Wei Date: Mon, 24 Oct 2022 10:25:34 +0800 Subject: [PATCH 34/68] rollback 0.8.2 version bump PR (#771) Signed-off-by: Yuqing Wei --- build.sbt | 2 +- docs/how-to-guides/azure_resource_provision.json | 2 +- feathr_project/test/test_user_workspace/feathr_config.yaml | 4 ++-- .../test_user_workspace/feathr_config_registry_purview.yaml | 4 ++-- .../feathr_config_registry_purview_rbac.yaml | 4 ++-- .../test/test_user_workspace/feathr_config_registry_sql.yaml | 4 ++-- .../test_user_workspace/feathr_config_registry_sql_rbac.yaml | 4 ++-- 7 files changed, 12 insertions(+), 12 deletions(-) diff --git a/build.sbt b/build.sbt index d85f99016..2919ddae6 100644 --- a/build.sbt +++ b/build.sbt @@ -2,7 +2,7 @@ import sbt.Keys.publishLocalConfiguration ThisBuild / resolvers += Resolver.mavenLocal ThisBuild / scalaVersion := "2.12.15" -ThisBuild / version := "0.8.2" +ThisBuild / version := "0.8.0" ThisBuild / organization := "com.linkedin.feathr" ThisBuild / organizationName := "linkedin" val sparkVersion = "3.1.3" diff --git a/docs/how-to-guides/azure_resource_provision.json b/docs/how-to-guides/azure_resource_provision.json index 6ab77a419..03d175052 100644 --- a/docs/how-to-guides/azure_resource_provision.json +++ b/docs/how-to-guides/azure_resource_provision.json @@ -111,7 +111,7 @@ "destinationBacpacBlobUrl": "[concat('https://',variables('dlsName'),'.blob.core.windows.net/',variables('dlsFsName'),'/',variables('bacpacBlobName'))]", "bacpacDeploymentScriptName": "CopyBacpacFile", "bacpacDbExtensionName": "registryRbacDbImport", - "preBuiltdockerImage": "feathrfeaturestore/feathr-registry:releases-v0.8.2" + "preBuiltdockerImage": "feathrfeaturestore/feathr-registry:releases-v0.8.0" }, "functions": [], "resources": [ diff --git a/feathr_project/test/test_user_workspace/feathr_config.yaml b/feathr_project/test/test_user_workspace/feathr_config.yaml index b0f2b259c..e67c803ef 100644 --- a/feathr_project/test/test_user_workspace/feathr_config.yaml +++ b/feathr_project/test/test_user_workspace/feathr_config.yaml @@ -82,7 +82,7 @@ spark_config: # Feathr Job configuration. Support local paths, path start with http(s)://, and paths start with abfs(s):// # this is the default location so end users don't have to compile the runtime again. # feathr_runtime_location: wasbs://public@azurefeathrstorage.blob.core.windows.net/feathr-assembly-LATEST.jar - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" databricks: # workspace instance workspace_instance_url: 'https://adb-2474129336842816.16.azuredatabricks.net/' @@ -93,7 +93,7 @@ spark_config: # Feathr Job location. Support local paths, path start with http(s)://, and paths start with dbfs:/ work_dir: 'dbfs:/feathr_getting_started' # this is the default location so end users don't have to compile the runtime again. 
- feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" online_store: redis: diff --git a/feathr_project/test/test_user_workspace/feathr_config_registry_purview.yaml b/feathr_project/test/test_user_workspace/feathr_config_registry_purview.yaml index 003e424eb..f716da0b4 100644 --- a/feathr_project/test/test_user_workspace/feathr_config_registry_purview.yaml +++ b/feathr_project/test/test_user_workspace/feathr_config_registry_purview.yaml @@ -25,13 +25,13 @@ spark_config: workspace_dir: 'abfss://feathrazuretest3fs@feathrazuretest3storage.dfs.core.windows.net/feathr_test_workspace' executor_size: 'Small' executor_num: 1 - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" databricks: workspace_instance_url: 'https://adb-2474129336842816.16.azuredatabricks.net/' workspace_token_value: '' config_template: {"run_name":"FEATHR_FILL_IN","new_cluster":{"spark_version":"9.1.x-scala2.12","num_workers":1,"spark_conf":{"FEATHR_FILL_IN":"FEATHR_FILL_IN"},"instance_pool_id":"0403-214809-inlet434-pool-l9dj3kwz"},"libraries":[{"jar":"FEATHR_FILL_IN"}],"spark_jar_task":{"main_class_name":"FEATHR_FILL_IN","parameters":["FEATHR_FILL_IN"]}} work_dir: 'dbfs:/feathr_getting_started' - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" online_store: redis: diff --git a/feathr_project/test/test_user_workspace/feathr_config_registry_purview_rbac.yaml b/feathr_project/test/test_user_workspace/feathr_config_registry_purview_rbac.yaml index 0722a34d8..c842bc702 100644 --- a/feathr_project/test/test_user_workspace/feathr_config_registry_purview_rbac.yaml +++ b/feathr_project/test/test_user_workspace/feathr_config_registry_purview_rbac.yaml @@ -25,13 +25,13 @@ spark_config: workspace_dir: 'abfss://feathrazuretest3fs@feathrazuretest3storage.dfs.core.windows.net/feathr_test_workspace' executor_size: 'Small' executor_num: 1 - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" databricks: workspace_instance_url: 'https://adb-2474129336842816.16.azuredatabricks.net/' workspace_token_value: '' config_template: {"run_name":"FEATHR_FILL_IN","new_cluster":{"spark_version":"9.1.x-scala2.12","num_workers":1,"spark_conf":{"FEATHR_FILL_IN":"FEATHR_FILL_IN"},"instance_pool_id":"0403-214809-inlet434-pool-l9dj3kwz"},"libraries":[{"jar":"FEATHR_FILL_IN"}],"spark_jar_task":{"main_class_name":"FEATHR_FILL_IN","parameters":["FEATHR_FILL_IN"]}} work_dir: 'dbfs:/feathr_getting_started' - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" online_store: redis: diff --git a/feathr_project/test/test_user_workspace/feathr_config_registry_sql.yaml b/feathr_project/test/test_user_workspace/feathr_config_registry_sql.yaml index 507b096cb..dcb73d827 100644 --- a/feathr_project/test/test_user_workspace/feathr_config_registry_sql.yaml +++ b/feathr_project/test/test_user_workspace/feathr_config_registry_sql.yaml @@ -25,13 +25,13 @@ spark_config: workspace_dir: 'abfss://feathrazuretest3fs@feathrazuretest3storage.dfs.core.windows.net/feathr_test_workspace' executor_size: 'Small' executor_num: 1 - feathr_runtime_location: 
"../../target/scala-2.12/feathr-assembly-0.8.2.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" databricks: workspace_instance_url: 'https://adb-2474129336842816.16.azuredatabricks.net/' workspace_token_value: '' config_template: {"run_name":"FEATHR_FILL_IN","new_cluster":{"spark_version":"9.1.x-scala2.12","num_workers":1,"spark_conf":{"FEATHR_FILL_IN":"FEATHR_FILL_IN"},"instance_pool_id":"0403-214809-inlet434-pool-l9dj3kwz"},"libraries":[{"jar":"FEATHR_FILL_IN"}],"spark_jar_task":{"main_class_name":"FEATHR_FILL_IN","parameters":["FEATHR_FILL_IN"]}} work_dir: 'dbfs:/feathr_getting_started' - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" online_store: redis: diff --git a/feathr_project/test/test_user_workspace/feathr_config_registry_sql_rbac.yaml b/feathr_project/test/test_user_workspace/feathr_config_registry_sql_rbac.yaml index 9403cb190..29c6889e8 100644 --- a/feathr_project/test/test_user_workspace/feathr_config_registry_sql_rbac.yaml +++ b/feathr_project/test/test_user_workspace/feathr_config_registry_sql_rbac.yaml @@ -25,13 +25,13 @@ spark_config: workspace_dir: 'abfss://feathrazuretest3fs@feathrazuretest3storage.dfs.core.windows.net/feathr_test_workspace' executor_size: 'Small' executor_num: 1 - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" databricks: workspace_instance_url: 'https://adb-2474129336842816.16.azuredatabricks.net/' workspace_token_value: '' config_template: {"run_name":"FEATHR_FILL_IN","new_cluster":{"spark_version":"9.1.x-scala2.12","num_workers":1,"spark_conf":{"FEATHR_FILL_IN":"FEATHR_FILL_IN"},"instance_pool_id":"0403-214809-inlet434-pool-l9dj3kwz"},"libraries":[{"jar":"FEATHR_FILL_IN"}],"spark_jar_task":{"main_class_name":"FEATHR_FILL_IN","parameters":["FEATHR_FILL_IN"]}} work_dir: 'dbfs:/feathr_getting_started' - feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.2.jar" + feathr_runtime_location: "../../target/scala-2.12/feathr-assembly-0.8.0.jar" online_store: redis: From 6a3a0443336b28a2548fed4c2664ed78337e82a3 Mon Sep 17 00:00:00 2001 From: Richin Jain Date: Mon, 24 Oct 2022 08:07:54 +0530 Subject: [PATCH 35/68] Refactor Product Recommendation sample notebook (#743) * Adding DevSkim linter to Github actions * Update docker-publish.yml * Update docker-publish.yml * Update docker-publish.yml * Update docker-publish.yml * Update docker-publish.yml * Update docker-publish.yml * Update docker-publish.yml * Update docker-publish.yml * Removing devskim file * Restructuring the Prod Reco sample * Adjusting headings * Minor changes * Removing changes to docker publish file * Addressing PR comments, moving Product recommendation notebook sample to Synapse folder since it is strongly tied to Synapse * Addressing PR comments * Fixing images * Removing the need to pass email id as we could directly compute object Id using az command, also making CLI instructions clearer that it is for advance users --- .../product_recommendation_demo.ipynb | 316 ++++++++---------- 1 file changed, 140 insertions(+), 176 deletions(-) rename docs/samples/{ => azure_synapse}/product_recommendation_demo.ipynb (69%) diff --git a/docs/samples/product_recommendation_demo.ipynb b/docs/samples/azure_synapse/product_recommendation_demo.ipynb similarity index 69% rename from docs/samples/product_recommendation_demo.ipynb rename to 
docs/samples/azure_synapse/product_recommendation_demo.ipynb index 44febb062..e93860269 100644 --- a/docs/samples/product_recommendation_demo.ipynb +++ b/docs/samples/azure_synapse/product_recommendation_demo.ipynb @@ -4,26 +4,32 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "# Demo Notebook: Feathr Feature Store on Azure\n", + "# Product Recommendation with Feathr on Azure\n", "\n", "This notebook demonstrates how Feathr Feature Store can simplify and empower your model training and inference. You will learn:\n", "\n", "1. Define sharable features using Feathr API\n", - "2. Create a training dataset via point-in-time feature join with Feathr API\n", - "3. Materialize features to online store and then retrieve them with Feathr API" + "2. Register features with register API.\n", + "3. Create a training dataset via point-in-time feature join with Feathr API\n", + "4. Materialize features to online store and then retrieve them with Feathr API\n", + "\n", + "In this tutorial, we use Feathr to create a model that predicts users' product rating. " ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "## Prerequisite: Use Quick Start Template to Provision Azure Resources\n", + "## 1. Prerequisite: Use Azure Resource Manager(ARM) to Provision Azure Resources\n", "\n", "First step is to provision required cloud resources if you want to use Feathr. Feathr provides a python based client to interact with cloud resources.\n", "\n", - "Please follow the steps [here](https://feathr-ai.github.io/feathr/how-to-guides/azure-deployment-arm.html) to provision required cloud resources. Due to the complexity of the possible cloud environment, it is almost impossible to create a script that works for all the use cases. Because of this, [azure_resource_provision.sh](https://github.com/feathr-ai/feathr/blob/main/docs/how-to-guides/azure_resource_provision.sh) is a full end to end command line to create all the required resources, and you can tailor the script as needed, while [the companion documentation](https://feathr-ai.github.io/feathr/how-to-guides/azure-deployment-cli.html) can be used as a complete guide for using that shell script. \n", + "Please follow the steps [here](https://feathr-ai.github.io/feathr/how-to-guides/azure-deployment-arm.html) to provision required cloud resources. This will create a new resource group and deploy the needed Azure resources in it. \n", "\n", + "If you already have an existing resource group and only want to install few resources manually you can refer to the cli documentation [here](https://feathr-ai.github.io/feathr/how-to-guides/azure-deployment-cli.html). It provides CLI commands to install the needed resources. \n", + "**Please Note: CLI documentation is for advance users since there are lot of configurations and role assignment that would have to be done manually so it won't work out of box and should just be used for reference. ARM template is the preferred way to deploy.**\n", "\n", + "The below architecture diagram represents how different resources interact with each other\n", "![Architecture](https://github.com/feathr-ai/feathr/blob/main/docs/images/architecture.png?raw=true)" ] }, @@ -31,11 +37,9 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "## Prerequisite: Install Feathr and Import Dependencies\n", - "\n", - "Install Feathr using pip:\n", + "## 2. 
Prerequisite: Login to Azure and Install Feathr\n", "\n", - "`pip install -U feathr pandavro scikit-learn`" + "Login to Azure with a device code (You will see instructions in the output once you execute the cell):" ] }, { @@ -44,53 +48,14 @@ "metadata": {}, "outputs": [], "source": [ - "# Import Dependencies\n", - "import glob\n", - "import os\n", - "import tempfile\n", - "from datetime import datetime, timedelta\n", - "from math import sqrt\n", - "\n", - "import pandas as pd\n", - "import pandavro as pdx\n", - "from feathr import FeathrClient\n", - "from feathr import BOOLEAN, FLOAT, INT32, ValueType\n", - "from feathr import Feature, DerivedFeature, FeatureAnchor\n", - "from feathr import BackfillTime, MaterializationSettings\n", - "from feathr import FeatureQuery, ObservationSettings\n", - "from feathr import RedisSink\n", - "from feathr import INPUT_CONTEXT, HdfsSource\n", - "from feathr import WindowAggTransformation\n", - "from feathr import TypedKey\n", - "from sklearn.metrics import mean_squared_error\n", - "from sklearn.model_selection import train_test_split\n", - "from azure.identity import DefaultAzureCredential\n", - "from azure.keyvault.secrets import SecretClient" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Prerequisite: Configure the required environment with Feathr Quick Start Template\n", - "\n", - "In the first step (Provision cloud resources), you should have provisioned all the required cloud resources. Run the code below to install Feathr, login to Azure to get the required credentials to access more cloud resources." + "! az login --use-device-code" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "**REQUIRED STEP: Fill in the resource prefix when provisioning the resources**" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "resource_prefix = \"feathr_resource_prefix\"" + "Install Feathr and dependencies to run this notebook." ] }, { @@ -99,14 +64,14 @@ "metadata": {}, "outputs": [], "source": [ - "! pip install feathr azure-cli pandavro scikit-learn" + "%pip install -U feathr pandavro scikit-learn" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "Login to Azure with a device code (You will see instructions in the output):" + "Import Dependencies to make sure everything is installed correctly" ] }, { @@ -115,7 +80,27 @@ "metadata": {}, "outputs": [], "source": [ - "! az login --use-device-code" + "import glob\n", + "import os\n", + "import tempfile\n", + "from datetime import datetime, timedelta\n", + "from math import sqrt\n", + "\n", + "import pandas as pd\n", + "import pandavro as pdx\n", + "from feathr import FeathrClient\n", + "from feathr import BOOLEAN, FLOAT, INT32, ValueType\n", + "from feathr import Feature, DerivedFeature, FeatureAnchor\n", + "from feathr import BackfillTime, MaterializationSettings\n", + "from feathr import FeatureQuery, ObservationSettings\n", + "from feathr import RedisSink\n", + "from feathr import INPUT_CONTEXT, HdfsSource\n", + "from feathr import WindowAggTransformation\n", + "from feathr import TypedKey\n", + "from sklearn.metrics import mean_squared_error\n", + "from sklearn.model_selection import train_test_split\n", + "from azure.identity import AzureCliCredential\n", + "from azure.keyvault.secrets import SecretClient" ] }, { @@ -123,20 +108,19 @@ "metadata": {}, "source": [ "\n", - "**Permission**\n", + "## 3. 
Prerequisite: Set the required permissions\n", "\n", - "To proceed with the following steps, you may need additional permission: permission to access the keyvault, permission to access the Storage Blob as a Contributor and permission to submit jobs to Synapse cluster. Skip this step if you have already given yourself the access. Otherwise, run the following lines of command in the Cloud Shell before running the cell below.\n", + "Before you proceed further, you would need additional permissions: permission to access the keyvault, permission to access the Storage Blob as a Contributor and permission to submit jobs to Synapse cluster. Run the following lines of command in the [Cloud Shell](https://shell.azure.com) before running the cells below. Please replace the resource_prefix with the prefix you used in ARM template deployment.\n", "\n", "```\n", - "userId=\n", - "resource_prefix=\n", - "synapse_workspace_name=\"${resource_prefix}syws\"\n", - "keyvault_name=\"${resource_prefix}kv\"\n", - "objectId=$(az ad user show --id $userId --query id -o tsv)\n", - "az keyvault update --name $keyvault_name --enable-rbac-authorization false\n", - "az keyvault set-policy -n $keyvault_name --secret-permissions get list --object-id $objectId\n", - "az role assignment create --assignee $userId --role \"Storage Blob Data Contributor\"\n", - "az synapse role assignment create --workspace-name $synapse_workspace_name --role \"Synapse Contributor\" --assignee $userId\n", + " resource_prefix=\"YOUR_RESOURCE_PREFIX\"\n", + " synapse_workspace_name=\"${resource_prefix}syws\"\n", + " keyvault_name=\"${resource_prefix}kv\"\n", + " objectId=$(az ad signed-in-user show --query id -o tsv)\n", + " az keyvault update --name $keyvault_name --enable-rbac-authorization false\n", + " az keyvault set-policy -n $keyvault_name --secret-permissions get list --object-id $objectId\n", + " az role assignment create --assignee $userId --role \"Storage Blob Data Contributor\"\n", + " az synapse role assignment create --workspace-name $synapse_workspace_name --role \"Synapse Contributor\" --assignee $userId\n", "```\n" ] }, @@ -144,7 +128,12 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "Get all the required credentials from Azure KeyVault" + "# 4. Prerequisite: Feathr Configuration\n", + "\n", + "### Setting the environment variables\n", + "Set the environment variables that will be used by Feathr as configuration. 
Feathr supports configuration via enviroment variables and yaml, you can read more about it [here](https://feathr-ai.github.io/feathr/how-to-guides/feathr-configuration-and-env.html).\n", + "\n", + "**Fill in the `resource_prefix` that you used while provisioning the resources in Step 1 using ARM.**" ] }, { @@ -153,44 +142,49 @@ "metadata": {}, "outputs": [], "source": [ - "# Get all the required credentials from Azure Key Vault\n", - "key_vault_name=resource_prefix+\"kv\"\n", - "synapse_workspace_url=resource_prefix+\"syws\"\n", - "adls_account=resource_prefix+\"dls\"\n", - "adls_fs_name=resource_prefix+\"fs\"\n", - "purview_name=resource_prefix+\"purview\"\n", - "key_vault_uri = f\"https://{key_vault_name}.vault.azure.net\"\n", - "credential = DefaultAzureCredential(exclude_interactive_browser_credential=False)\n", - "client = SecretClient(vault_url=key_vault_uri, credential=credential)\n", - "secretName = \"FEATHR-ONLINE-STORE-CONN\"\n", - "retrieved_secret = client.get_secret(secretName).value\n", - "\n", - "# Get redis credentials; This is to parse Redis connection string.\n", - "redis_port=retrieved_secret.split(',')[0].split(\":\")[1]\n", - "redis_host=retrieved_secret.split(',')[0].split(\":\")[0]\n", - "redis_password=retrieved_secret.split(',')[1].split(\"password=\",1)[1]\n", - "redis_ssl=retrieved_secret.split(',')[2].split(\"ssl=\",1)[1]\n", - "\n", - "# Set the resource link\n", - "os.environ['spark_config__azure_synapse__dev_url'] = f'https://{synapse_workspace_url}.dev.azuresynapse.net'\n", - "os.environ['spark_config__azure_synapse__pool_name'] = 'spark31'\n", - "os.environ['spark_config__azure_synapse__workspace_dir'] = f'abfss://{adls_fs_name}@{adls_account}.dfs.core.windows.net/feathr_project'\n", - "os.environ['online_store__redis__host'] = redis_host\n", - "os.environ['online_store__redis__port'] = redis_port\n", - "os.environ['online_store__redis__ssl_enabled'] = redis_ssl\n", - "os.environ['REDIS_PASSWORD']=redis_password\n", - "feathr_output_path = f'abfss://{adls_fs_name}@{adls_account}.dfs.core.windows.net/feathr_output'" + "RESOURCE_PREFIX = \"YOUR_RESOURCE_PREFIX\" # from ARM deployment in Step 1\n", + "FEATHR_PROJECT_NAME=\"YOUR_PROJECT_NAME\" # provide a unique name" ] }, { - "cell_type": "markdown", + "cell_type": "code", + "execution_count": null, "metadata": {}, + "outputs": [], "source": [ - "## Prerequisite: Configure the required environment (Skip this step if using the above Quick Start Template)\n", "\n", - "In the first step (Provision cloud resources), you should have provisioned all the required cloud resources. If you use Feathr CLI to create a workspace, you should have a folder with a file called `feathr_config.yaml` in it with all the required configurations. Otherwise, update the configuration below.\n", + "# Get name for deployed resources using the resource prefix\n", + "KEY_VAULT_NAME=f\"{RESOURCE_PREFIX}kv\"\n", + "SYNAPSE_WORKSPACE_NAME=f\"{RESOURCE_PREFIX}syws\"\n", + "ADLS_ACCOUNT=f\"{RESOURCE_PREFIX}dls\"\n", + "ADLS_FS_NAME=f\"{RESOURCE_PREFIX}fs\"\n", + "KEY_VAULT_URI = f\"https://{KEY_VAULT_NAME}.vault.azure.net\"\n", + "FEATHR_API_APP = f\"{RESOURCE_PREFIX}webapp\"\n", + "\n", "\n", - "The code below will write this configuration string to a temporary location and load it to Feathr. Please still refer to [feathr_config.yaml](https://github.com/feathr-ai/feathr/blob/main/feathr_project/feathrcli/data/feathr_user_workspace/feathr_config.yaml) and use that as the source of truth. 
It should also have more explanations on the meaning of each variable." + "# Getting the credential object for Key Vault client\n", + "credential = AzureCliCredential()\n", + "client = SecretClient(vault_url=KEY_VAULT_URI, credential=credential)\n", + "\n", + "# Getting Redis store's connection string.\n", + "retrieved_secret = client.get_secret(\"FEATHR-ONLINE-STORE-CONN\").value\n", + "\n", + "# Parse Redis connection string\n", + "REDIS_PORT=retrieved_secret.split(',')[0].split(\":\")[1]\n", + "REDIS_HOST=retrieved_secret.split(',')[0].split(\":\")[0]\n", + "REDIS_PASSWORD=retrieved_secret.split(',')[1].split(\"password=\",1)[1]\n", + "REDIS_SSL=retrieved_secret.split(',')[2].split(\"ssl=\",1)[1]\n", + "# Set password as environment variable.\n", + "os.environ['REDIS_PASSWORD']=REDIS_PASSWORD" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Write the configuration as yaml file.\n", + "\n", + "The code below will write this configuration string to a temporary location and load it to Feathr. Please refer to [feathr_config.yaml](https://github.com/feathr-ai/feathr/blob/main/feathr_project/feathrcli/data/feathr_user_workspace/feathr_config.yaml) for full list of configuration options and details about them." ] }, { @@ -200,68 +194,38 @@ "outputs": [], "source": [ "import tempfile\n", - "yaml_config = \"\"\"\n", - "# Please refer to https://github.com/feathr-ai/feathr/blob/main/feathr_project/feathrcli/data/feathr_user_workspace/feathr_config.yaml for explanations on the meaning of each field.\n", + "yaml_config = f\"\"\"\n", "api_version: 1\n", "project_config:\n", - " project_name: 'feathr_getting_started'\n", - " required_environment_variables:\n", - " - 'REDIS_PASSWORD'\n", + " project_name: '{FEATHR_PROJECT_NAME}'\n", "offline_store:\n", "# Please set 'enabled' flags as true (false by default) if any of items under the same paths are expected to be visited\n", " adls:\n", " adls_enabled: true\n", " wasb:\n", " wasb_enabled: true\n", - " s3:\n", - " s3_enabled: false\n", - " s3_endpoint: 's3.amazonaws.com'\n", - " jdbc:\n", - " jdbc_enabled: false\n", - " jdbc_database: 'feathrtestdb'\n", - " jdbc_table: 'feathrtesttable'\n", - " snowflake:\n", - " snowflake_enabled: false\n", - " url: \".snowflakecomputing.com\"\n", - " user: \"\"\n", - " role: \"\"\n", "spark_config:\n", " spark_cluster: 'azure_synapse'\n", " spark_result_output_parts: '1'\n", " azure_synapse:\n", - " dev_url: 'https://feathrazuretest3synapse.dev.azuresynapse.net'\n", - " pool_name: 'spark3'\n", - " workspace_dir: 'abfss://feathrazuretest3fs@feathrazuretest3storage.dfs.core.windows.net/feathr_getting_started'\n", + " dev_url: 'https://{SYNAPSE_WORKSPACE_NAME}.dev.azuresynapse.net'\n", + " pool_name: 'spark31'\n", + " workspace_dir: 'abfss://{ADLS_FS_NAME}@{ADLS_ACCOUNT}.dfs.core.windows.net/feathr_project'\n", " executor_size: 'Small'\n", " executor_num: 1\n", - " databricks:\n", - " workspace_instance_url: 'https://adb-2474129336842816.16.azuredatabricks.net'\n", - " config_template: {'run_name':'','new_cluster':{'spark_version':'9.1.x-scala2.12','node_type_id':'Standard_D3_v2','num_workers':2,'spark_conf':{}},'libraries':[{'jar':''}],'spark_jar_task':{'main_class_name':'','parameters':['']}}\n", - " work_dir: 'dbfs:/feathr_getting_started'\n", "online_store:\n", " redis:\n", - " host: 'feathrazuretest3redis.redis.cache.windows.net'\n", - " port: 6380\n", - " ssl_enabled: True\n", + " host: '{REDIS_HOST}'\n", + " port: {REDIS_PORT}\n", + " ssl_enabled: {REDIS_SSL}\n", 
"feature_registry:\n", - " api_endpoint: \"https://feathr-sql-registry.azurewebsites.net/api/v1\"\n", + " api_endpoint: 'https://{FEATHR_API_APP}.azurewebsites.net/api/v1'\n", "\"\"\"\n", + "\n", "tmp = tempfile.NamedTemporaryFile(mode='w', delete=False)\n", "with open(tmp.name, \"w\") as text_file:\n", " text_file.write(yaml_config)\n", - "feathr_output_path = f'abfss://feathrazuretest3fs@feathrazuretest3storage.dfs.core.windows.net/feathr_output'" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Prerequisite: Setup necessary environment variables (Skip this step if using the above Quick Start Template)\n", - "\n", - "You should setup the environment variables in order to run this sample. More environment variables can be set by referring to [feathr_config.yaml](https://github.com/feathr-ai/feathr/blob/main/feathr_project/feathrcli/data/feathr_user_workspace/feathr_config.yaml) and use that as the source of truth. It also has more explanations on the meaning of each variable.\n", - "\n", - "To run this notebook, for Azure users, you need REDIS_PASSWORD.\n", - "To run this notebook, for Databricks useres, you need DATABRICKS_WORKSPACE_TOKEN_VALUE and REDIS_PASSWORD." + "feathr_output_path = f'abfss://{ADLS_FS_NAME}@{ADLS_ACCOUNT}.dfs.core.windows.net/feathr_output'" ] }, { @@ -270,10 +234,10 @@ "source": [ "# Define sharable features using Feathr API\n", "\n", - "In this tutorial, we use Feathr Feature Store to help create a model that predicts users product rating. To make it simple, let's just predict users' rating for ONE product for an e-commerce website. (We have an [advanced demo](./product_recommendation_demo_advanced.ipynb) that predicts ratings for arbitrary products.)\n", + "In this tutorial, we use Feathr Feature Store and create a model that predicts users' product rating. To make it simple, let's just predict users' rating for ONE product for an e-commerce website. (We have an [advanced demo](../product_recommendation_demo_advanced.ipynb) that predicts ratings for arbitrary products.)\n", "\n", "\n", - "## Initialize Feathr Client\n", + "### Initialize Feathr Client\n", "\n", "Let's initialize a Feathr client first. The Feathr client provides all the APIs we need to interact with Feathr Feature Store." ] @@ -291,7 +255,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "## Understand the Raw Datasets\n", + "### Understand the Raw Datasets\n", "We have 3 raw datasets to work with: one observation dataset(a.k.a. label dataset) and two raw datasets to generate features." ] }, @@ -305,6 +269,7 @@ "# Observation dataset usually comes with a event_timestamp to denote when the observation happened.\n", "# The label here is product_rating. Our model objective is to predict a user's rating for this product.\n", "import pandas as pd\n", + "# Public URL hosting mock data\n", "pd.read_csv(\"https://azurefeathrstorage.blob.core.windows.net/public/sample_data/product_recommendation_sample/user_observation_mock_data.csv\")" ] }, @@ -346,7 +311,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "## What's a Feature in Feathr\n", + "### What's a Feature in Feathr\n", "A feature is an individual measurable property or characteristic of a phenomenon which is sometimes time-sensitive. \n", "\n", "In Feathr, feature can be defined by the following characteristics:\n", @@ -360,7 +325,7 @@ "1. Feature source: what source data that this feature is based on\n", "2. Transformation: what transformation is used to transform the source data into feature. 
Transformation can be optional when you just want to take a column out from the source data.\n", "\n", - "(For more details on feature definition, please refer to the [Feathr Feature Definition Guide](https://github.com/feathr-ai/feathr/blob/main/docs/concepts/feature-definition.md))" + "(For more details on feature definition, please refer to the [Feathr Feature Definition Guide](https://feathr-ai.github.io/feathr/concepts/feature-definition.html))" ] }, { @@ -456,9 +421,7 @@ "source": [ "### Window aggregation features\n", "\n", - "Using [window aggregations](https://en.wikipedia.org/wiki/Window_function_%28SQL%29) can help us create more powerful features. A window aggregation feature compress large amount of information into one single feature value. Using our raw data as an example, we have the users' purchase history data that might be quite some rows, we want to create a window aggregation feature that represents their last 90 days of average purcahse amount.\n", - "\n", - "Feathr provides a nice API to help us create such window aggregation features.\n", + "Using [window aggregations](https://en.wikipedia.org/wiki/Window_function_%28SQL%29) can help us create more powerful features. A window aggregation feature compresses large amount of information into one single feature value. Using our raw data as an example, we have the user's purchase history data that might be quite some rows, we want to create a window aggregation feature that represents their last 90 days of average purchase amount.\n", "\n", "To create this window aggregation feature via Feathr, we just need to define the following parameters with `WindowAggTransformation` API:\n", "1. `agg_expr`: the field/column you want to aggregate. It can be a ANSI SQL expression. So we just write `cast_float(purchase_amount)`(the raw data might be in string form, let's cast_float).\n", @@ -509,9 +472,7 @@ "### Derived Features Section\n", "Derived features are features that are computed from other Feathr features. They could be computed from anchored features, or other derived features.\n", "\n", - "Typical usage includes feature cross(f1 * f2), or computing cosine similarity between two features.\n", - "\n", - "The syntax works in a similar way." + "Typical usage includes feature cross(f1 * f2), or computing cosine similarity between two features. The syntax works in a similar way." ] }, { @@ -532,7 +493,7 @@ "metadata": {}, "source": [ "### Build Features\n", - "Lastly, we need to build those features so that it can be consumed later. Note that we have to build both the \"anchor\" and the \"derived\" features." + "Lastly, we need to build these features so that they can be consumed later. Note that we have to build both the \"anchor\" and the \"derived\" features." ] }, { @@ -550,12 +511,11 @@ "metadata": {}, "source": [ "### Optional: A Special Type of Feature: Request Feature\n", - "For advanced user cases, in some cases, features defined on top of request data(a.k.a. observation data) may have no entity key or timestamp.\n", - "It is merely a function/transformation executing against request data at runtime.\n", - "For example, the day of week of the request, which is calculated by converting the request UNIX timestamp.\n", - "In this case, the `source` section should be `INPUT_CONTEXT` to indicate the source of those defined anchors.\n", + "Sometimes features defined on top of request data(a.k.a. observation data) may have no entity key or timestamp. 
It is merely a function/transformation executing against request data at runtime.\n", + "\n", + "For example, the day of the week of the request, which is calculated by converting the request UNIX timestamp. In this case, the `source` section should be `INPUT_CONTEXT` to indicate the source of those defined anchors.\n", "\n", - "We won't cover the details it in this notebook." + "We won't cover the details of it in this notebook." ] }, { @@ -564,12 +524,11 @@ "source": [ "## Create training data using point-in-time correct feature join\n", "\n", - "A training dataset usually contains entity id column(s), multiple feature columns, event timestamp column and label/target column. \n", + "A training dataset usually contains `entity id` column(s), multiple `feature` columns, event timestamp column and `label/target` column. \n", "\n", - "To create a training dataset using Feathr, we need to provide a feature join settings to specify\n", - "what features and how these features should be joined to the observation data. \n", + "To create a training dataset using Feathr, we need to provide a feature join settings to specify what features and how these features should be joined to the observation data. \n", "\n", - "(To learn more on this topic, please refer to [Point-in-time Correctness](https://github.com/feathr-ai/feathr/blob/main/docs/concepts/point-in-time-join.md))" + "(To learn more on this topic, please refer to [Point-in-time Correctness](https://feathr-ai.github.io/feathr/concepts/point-in-time-join.html))." ] }, { @@ -578,12 +537,7 @@ "metadata": {}, "outputs": [], "source": [ - "# Synapse and Databricks have different output path format\n", - "if feathr_client.spark_runtime == 'databricks':\n", - " output_path = 'dbfs:/feathrazure_test.avro'\n", - "else:\n", - " output_path = feathr_output_path\n", - "\n", + "output_path = feathr_output_path\n", "# Features that we want to request\n", "feature_query = FeatureQuery(feature_list=[\"feature_user_age\", \n", " \"feature_user_tax_rate\", \n", @@ -606,7 +560,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "## Download the result and show the result\n", + "### Download the result and show the result\n", "\n", "Let's use the helper function `get_result_df` to download the result and view it:" ] @@ -639,7 +593,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "## Train a machine learning model\n", + "### Train a machine learning model\n", "After getting all the features, let's train a machine learning model with the converted feature by Feathr:" ] }, @@ -694,16 +648,16 @@ "\n", "In the previous section, we demonstrated how Feathr can compute feature value to generate training dataset from feature definition on-they-fly.\n", "\n", - "Now let's talk about how we can use the trained models. We can use the trained models for offline inference as well as online inference. In both cases, we need features to be feed into the models. For offline inference, you can compute and get the features on-demand; or you can store the computed features to some offline database for later offline inference.\n", + "Now let's talk about how we can use the trained models. We can use the trained models for both online and offline inference. In both cases, we need features to be fed into the models. 
For offline inference, you can compute and get the features on-demand; or you can store the computed features to some offline database for later offline inference.\n", "\n", "For online inference, we can use Feathr to compute and store the features in the online database. Then use it for online inference when the request comes.\n", "\n", - "![img](../images/online_inference.jpg)\n", + "![img](../../images/online_inference.jpg)\n", "\n", "\n", - "In this section, we will focus on materialize features to online store. For materialization to offline store, you can check out our [user guide](https://github.com/feathr-ai/feathr/blob/main/docs/concepts/materializing-features.md#materializing-features-to-offline-store).\n", + "In this section, we will focus on materialize features to online store. For materialization to offline store, you can check out our [user guide](https://feathr-ai.github.io/feathr/concepts/materializing-features.html#materializing-features-to-offline-store).\n", "\n", - "We can push the computed features to the online store like below:" + "We can push the computed features to the online store(Redis) like below:" ] }, { @@ -729,7 +683,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "## Fetch feature value from online store\n", + "### Fetch feature value from online store\n", "We can then get the features from the online store (Redis) via the client's `get_online_features` or `multi_get_online_features` API." ] }, @@ -761,7 +715,7 @@ "source": [ "### Registering and Fetching features\n", "\n", - "We can also register the features with an Apache Atlas compatible service, such as Azure Purview, and share the registered features across teams:" + "We can also register the features and share them across teams:" ] }, { @@ -771,13 +725,23 @@ "outputs": [], "source": [ "feathr_client.register_features()\n", - "feathr_client.list_registered_features(project_name=\"feathr_getting_started\")" + "feathr_client.list_registered_features(project_name=f\"{FEATHR_PROJECT_NAME}\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Summary\n", + "In this notebook you learnt how to set up Feathr and use it to create features, register features and use those features for model training and inferencing.\n", + "\n", + "We hope this example gave you a good sense of Feathr's capabilities and how you could leverage it within your organization's MLOps workflow." ] } ], "metadata": { "kernelspec": { - "display_name": "Python 3.9.12 ('ifelse_bug_env': venv)", + "display_name": "Python 3.8.13 ('feathrtest')", "language": "python", "name": "python3" }, @@ -791,11 +755,11 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.9.12" + "version": "3.8.13" }, "vscode": { "interpreter": { - "hash": "6a6c366ec8f33a88299a9f856c1a3e4312616abcb6fcf46b22c3da0a923e63af" + "hash": "96bbbb728c64ae5eda27ed1c89d74908bf0652fd45caa45cd0ade6bdc0df4d48" } } }, From eb6b9b86c75cf1c7d6e7f35261ded118eb5a8587 Mon Sep 17 00:00:00 2001 From: Boli Guan Date: Tue, 25 Oct 2022 11:48:25 +0800 Subject: [PATCH 36/68] Update role-management page in UI (#751) (#764) * Update role-management page in UI (#751) * fix home.css LF file * fix RoleForm eslint warning * remove import dayjs Signed-off-by: Boli Guan * Change components to arrow function. 
Signed-off-by: Boli Guan Signed-off-by: Boli Guan --- ui/package-lock.json | 10 +- ui/package.json | 1 + ui/src/pages/home/home.css | 46 ++--- .../management/components/RoleForm/index.tsx | 126 ++++++++++++ .../management/components/SearchBar/index.tsx | 71 +++++++ .../components/UserRolesTable/index.tsx | 190 ++++++++++++++++++ ui/src/pages/management/management.tsx | 28 ++- ui/src/pages/management/roleManagement.tsx | 25 ++- 8 files changed, 461 insertions(+), 36 deletions(-) create mode 100644 ui/src/pages/management/components/RoleForm/index.tsx create mode 100644 ui/src/pages/management/components/SearchBar/index.tsx create mode 100644 ui/src/pages/management/components/UserRolesTable/index.tsx diff --git a/ui/package-lock.json b/ui/package-lock.json index b3a0d27d8..28bd6553c 100644 --- a/ui/package-lock.json +++ b/ui/package-lock.json @@ -13,6 +13,7 @@ "antd": "^4.20.2", "axios": "^0.27.2", "dagre": "^0.8.5", + "dayjs": "^1.11.5", "react": "^17.0.2", "react-dom": "^17.0.2", "react-flow-renderer": "^9.7.4", @@ -6353,8 +6354,9 @@ } }, "node_modules/dayjs": { - "version": "1.11.1", - "license": "MIT" + "version": "1.11.5", + "resolved": "https://registry.npmjs.org/dayjs/-/dayjs-1.11.5.tgz", + "integrity": "sha512-CAdX5Q3YW3Gclyo5Vpqkgpj8fSdLQcRuzfX6mC6Phy0nfJ0eGYOeS7m4mt2plDWLAtA4TqTakvbboHvUxfe4iA==" }, "node_modules/debug": { "version": "4.3.4", @@ -20783,7 +20785,9 @@ "version": "2.28.0" }, "dayjs": { - "version": "1.11.1" + "version": "1.11.5", + "resolved": "https://registry.npmjs.org/dayjs/-/dayjs-1.11.5.tgz", + "integrity": "sha512-CAdX5Q3YW3Gclyo5Vpqkgpj8fSdLQcRuzfX6mC6Phy0nfJ0eGYOeS7m4mt2plDWLAtA4TqTakvbboHvUxfe4iA==" }, "debug": { "version": "4.3.4", diff --git a/ui/package.json b/ui/package.json index 3a211df1f..dc8ee5e7e 100644 --- a/ui/package.json +++ b/ui/package.json @@ -8,6 +8,7 @@ "antd": "^4.20.2", "axios": "^0.27.2", "dagre": "^0.8.5", + "dayjs": "^1.11.5", "react": "^17.0.2", "react-dom": "^17.0.2", "react-flow-renderer": "^9.7.4", diff --git a/ui/src/pages/home/home.css b/ui/src/pages/home/home.css index 5c4a3b8a8..308e45367 100644 --- a/ui/src/pages/home/home.css +++ b/ui/src/pages/home/home.css @@ -1,23 +1,23 @@ -.home .ant-card { - box-shadow: 5px 8px 15px 5px rgba(208, 216, 243, 0.6); - border-radius: 8px; -} - -.home .card-meta { - display: flex; -} - -.home .card-meta .ant-card-meta-avatar { - max-width: 80px; - flex-basis: 30%; - box-sizing: border-box; -} - -.home .card-meta .ant-card-meta-avatar > span { - width: 100%; -} - -.home .card-meta .ant-card-meta-avatar svg { - width: 100%; - height: auto; -} +.home .ant-card { + box-shadow: 5px 8px 15px 5px rgba(208, 216, 243, 0.6); + border-radius: 8px; +} + +.home .card-meta { + display: flex; +} + +.home .card-meta .ant-card-meta-avatar { + max-width: 80px; + flex-basis: 30%; + box-sizing: border-box; +} + +.home .card-meta .ant-card-meta-avatar > span { + width: 100%; +} + +.home .card-meta .ant-card-meta-avatar svg { + width: 100%; + height: auto; +} diff --git a/ui/src/pages/management/components/RoleForm/index.tsx b/ui/src/pages/management/components/RoleForm/index.tsx new file mode 100644 index 000000000..9e073abd8 --- /dev/null +++ b/ui/src/pages/management/components/RoleForm/index.tsx @@ -0,0 +1,126 @@ +import React, { forwardRef, useCallback, useEffect, useState } from "react"; +import { Form, Select, Input, Button, message } from "antd"; +import { listUserRole, addUserRole } from "../../../../api"; + +export interface RoleFormProps { + getRole?: (isAdmin: boolean) => void; +} + +const { Item } = 
Form; +const { TextArea } = Input; + +const RoleOptions = [ + { label: "Admin", value: "admin" }, + { label: "Producer", value: "producer" }, + { label: "Consumer", value: "consumer" }, +]; + +const ValidateRule = { + scope: [{ required: true, message: "Please select scope!" }], + userName: [{ required: true, message: "Please input user name!" }], + roleName: [{ required: true, message: "Please select role name!" }], + reason: [{ required: true, message: "Please input reason!" }], +}; + +const RoleForm = (props: RoleFormProps, ref: any) => { + const [form] = Form.useForm(); + const { getRole } = props; + const [loading, setLoading] = useState(false); + + const [scopeOptions, setScopeOptions] = useState< + { label: string; value: string }[] + >([]); + + const handleFinish = useCallback( + async (values) => { + try { + setLoading(true); + await addUserRole(values); + form.resetFields(); + message.success("User role is created successfully."); + } catch { + message.error("Failed to create user role."); + } finally { + setLoading(false); + } + }, + [form] + ); + + const handleInit = useCallback(async () => { + try { + const result = await listUserRole(); + if (result.length) { + const dataset = new Set( + result.reduce( + (list: string[], item) => { + list.push(item.scope); + return list; + }, + ["global"] + ) + ); + const options = Array.from(dataset).map((item) => { + return { + label: item, + value: item, + }; + }); + setScopeOptions(options); + return true; + } else { + return false; + } + } catch { + return false; + } + }, []); + + useEffect(() => { + handleInit().then((isAdmin: boolean) => { + getRole?.(isAdmin); + }); + }, [handleInit, getRole]); + + return ( +
    + + + + +