easy_sql.sql_processor.backend.spark

Module Contents

Classes

SparkBackend

SparkRow

SparkTable

class easy_sql.sql_processor.backend.spark.SparkBackend(spark, scala_udf_initializer=None)

Bases: easy_sql.sql_processor.backend.base.Backend

Inheritance diagram: Backend → SparkBackend

Parameters

scala_udf_initializer (Optional[str]) –

broadcast_table(self, table, name)
Parameters
  • table –

  • name –

clean(self)
clear_cache(self)
clear_temp_tables(self, exclude=None)
Parameters

exclude (Optional[List[str]]) –

create_cache_table(self, table, name)
Parameters
  • table –

  • name –

create_empty_table(self)
create_table_with_data(self, full_table_name, values, schema, partitions)
Parameters
  • full_table_name –

  • values –

  • schema –

  • partitions –

create_temp_table(self, table, name)
Parameters
  • table –

  • name –

create_temp_table_with_data(self, table_name, values, schema)
Parameters
  • table_name (str) –

  • values (List[List[Any]]) –

  • schema (pyspark.sql.types.StructType) –

exec_native_sql(self, sql)
Parameters

sql (str) –

Return type

pyspark.sql.DataFrame

exec_sql(self, sql)
Parameters

sql (str) –

Return type

easy_sql.sql_processor.backend.base.Table

init_udfs(self, scala_udf_initializer=None, *args, **kwargs)
Parameters

scala_udf_initializer (Optional[str]) –

refresh_table_partitions(self, table)
Parameters

table (easy_sql.sql_processor.backend.base.TableMeta) –

register_udfs(self, funcs)
Parameters

funcs (Dict[str, Callable]) –

reset(self)
save_table(self, source_table_meta, target_table_meta, save_mode, create_target_table)
Parameters
  • source_table_meta –

  • target_table_meta –

  • save_mode –

  • create_target_table –

save_table_sql(self, source_table, source_table_sql, target_table)
Parameters
  • source_table –

  • source_table_sql –

  • target_table –

Return type

str

set_spark_configs(self, configs)
Parameters

configs (Dict[str, str]) –

table_exists(self, table)
Parameters

table (easy_sql.sql_processor.backend.base.TableMeta) –

temp_tables(self)
Return type

List[str]

class easy_sql.sql_processor.backend.spark.SparkRow(row)

Bases: easy_sql.sql_processor.backend.base.Row

Inheritance diagram: Row → SparkRow

as_dict(self)
as_tuple(self)
Return type

Tuple

class easy_sql.sql_processor.backend.spark.SparkTable(df)

Bases: easy_sql.sql_processor.backend.base.Table

Inheritance diagram: Table → SparkTable

collect(self)
Return type

List[easy_sql.sql_processor.backend.base.Row]

count(self)
Return type

int

field_names(self)
Return type

List[str]

first(self)
Return type

easy_sql.sql_processor.backend.base.Row

is_empty(self)
Return type

bool

limit(self, count)
Parameters

count (int) –

Return type

SparkTable

show(self, count=20)
Parameters

count (int) –

with_column(self, name, value)
Parameters
  • name (str) –

  • value (Any) –

Return type

SparkTable