From 7385d8bb38d32b09f533e692b8d7e03bc23f35d0 Mon Sep 17 00:00:00 2001 From: Robert DeRienzo Date: Wed, 5 Jun 2024 00:08:53 -0400 Subject: [PATCH] #213 Add delta-lake as another extra to reduce deps by 200Mb (#242) Co-authored-by: Robert DeRienzo --- CHANGELOG.md | 2 +- README.md | 1 + pyproject.toml | 9 +++++++-- 3 files changed, 9 insertions(+), 3 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index a032f369..b0084665 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -9,7 +9,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0 ### Changed - Introduced optional dependencies/extras for significantly faster installation times. (#213) - +- Added delta-lake as an additional optional dependency ## [0.10.7] - 2024-05-31 diff --git a/README.md b/README.md index 537aacf4..5bc57896 100644 --- a/README.md +++ b/README.md @@ -190,6 +190,7 @@ A list of available extras: | Avro Support | `pip install datacontract-cli[avro]` | | Google BigQuery | `pip install datacontract-cli[bigquery]` | | Databricks Integration | `pip install datacontract-cli[databricks]` | +| Deltalake Integration | `pip install datacontract-cli[deltalake]` | | Kafka Integration | `pip install datacontract-cli[kafka]` | | PostgreSQL Integration | `pip install datacontract-cli[postgres]` | | S3 Integration | `pip install datacontract-cli[s3]` | diff --git a/pyproject.toml b/pyproject.toml index c9b09213..768c10cb 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -32,7 +32,6 @@ dependencies = [ "rdflib==7.0.0", "opentelemetry-exporter-otlp-proto-grpc~=1.16", "opentelemetry-exporter-otlp-proto-http~=1.16", - "deltalake~=0.17.0", "boto3>=1.34.41,<1.34.114", "botocore>=1.34.41,<1.34.114", "jinja_partials >= 0.2.1" @@ -48,12 +47,18 @@ bigquery = [ "soda-core-bigquery>=3.3.1,<3.4.0" ] + + databricks = [ "soda-core-spark-df>=3.3.1,<3.4.0", "databricks-sql-connector>=3.1.2,<3.2.0", "soda-core-spark[databricks]>=3.3.1,<3.4.0" ] +deltalake = [ + "deltalake~=0.17.0" +] + kafka = [ "datacontract-cli[avro]", "soda-core-spark-df>=3.3.1,<3.4.0" @@ -77,7 +82,7 @@ sqlserver = [ ] all = [ - "datacontract-cli[kafka,bigquery,snowflake,postgres,databricks,sqlserver,s3]" + "datacontract-cli[kafka,bigquery,snowflake,postgres,databricks,sqlserver,s3,deltalake]" ] dev = [