diff --git a/README.md b/README.md index 3bd8ccce0..cc3a63602 100644 --- a/README.md +++ b/README.md @@ -203,6 +203,10 @@ data-validation (--verbose or -v) validate row Comma-separated key value pair labels for the run. [--format or -fmt] Format for stdout output. Supported formats are (text, csv, json, table). Defaults to table. + [--use-random-row or -rr] + Selects a random set of rows based on the first primary key supplied. + [--random-row-batch-size or -rbs] + Row batch size used for random row filters. Defaults to 10,000. ``` #### Schema Validations diff --git a/data_validation/query_builder/random_row_builder.py b/data_validation/query_builder/random_row_builder.py index c94173e7c..60ef2b8d7 100644 --- a/data_validation/query_builder/random_row_builder.py +++ b/data_validation/query_builder/random_row_builder.py @@ -20,6 +20,7 @@ import ibis.expr.rules as rlz import ibis.backends.base_sqlalchemy.compiler as sql_compiler from ibis_bigquery import BigQueryClient +from ibis.backends.impala.client import ImpalaClient from ibis.backends.pandas.client import PandasClient import ibis.backends.pandas.execution.util as pandas_util @@ -43,6 +44,7 @@ RANDOM_SORT_SUPPORTS = { PandasClient: "NA", BigQueryClient: "RAND()", + ImpalaClient: "RAND()", }