diff --git a/discoverx/dx.py b/discoverx/dx.py index c280929..5136621 100644 --- a/discoverx/dx.py +++ b/discoverx/dx.py @@ -61,10 +61,18 @@ def intro(self):
- I'm here to help you discover data in your lakehouse.
- You can scan your lakehouse by using
+ I'm here to help you parallelize multi-table operations across your lakehouse.
+ You can start by defining the set of tables to run operations on (use "*" as a wildcard)
+
dx.from_tables("*.*.*")
+ + Then you can apply the following operations +
.apply_sql(...) - Runs a SQL template on each table
.scan(...) - Scan your lakehouse for columns matching the given rules
.search(...) - Search your lakehouse for columns matching the given search term
dx.scan(from_tables="*.*.*")
For more detailed instructions, check out the readme or use