Movatterモバイル変換


[0]ホーム

URL:


Skip to content

Navigation Menu

Sign in
Appearance settings

Search code, repositories, users, issues, pull requests...

Provide feedback

We read every piece of feedback, and take your input very seriously.

Saved searches

Use saved searches to filter your results more quickly

Sign up
Appearance settings

Commit 4cb15fd

Browse files
improved models and filters from cloudfetch-sea branch
Signed-off-by: varun-edachali-dbx <varun.edachali@databricks.com>
1 parent 0216d7a, commit 4cb15fd

File tree

4 files changed

+187
-49
lines changed

4 files changed

+187
-49
lines changed

‎src/databricks/sql/backend/filters.py‎

Lines changed: 39 additions & 22 deletions
Original file line number | Diff line number | Diff line change
@@ -9,14 +9,20 @@
99
List,
1010
Optional,
1111
Any,
12+
Dict,
1213
Callable,
14+
TypeVar,
15+
Generic,
16+
cast,
1317
TYPE_CHECKING,
1418
)
1519

16-
if TYPE_CHECKING:
17-
    from databricks.sql.result_set import ResultSet
20+
from databricks.sql.utils import JsonQueue, SeaResultSetQueueFactory
21+
from databricks.sql.backend.types import ExecuteResponse, CommandId
22+
from databricks.sql.backend.sea.models.base import ResultData
1823
 
19-
from databricks.sql.result_set import SeaResultSet
24+
if TYPE_CHECKING:
25+
    from databricks.sql.result_set import ResultSet, SeaResultSet
2026

2127
logger=logging.getLogger(__name__)
2228

@@ -43,26 +49,35 @@ def _filter_sea_result_set(
4349
Returns:
4450
A filtered SEA result set
4551
"""
46-
# Create a filtered version of the result set
47-
filtered_response=result_set._response.copy()
48-
49-
# If there's a result with rows, filter them
50-
if (
51-
"result"infiltered_response
52-
and"data_array"infiltered_response["result"]
53-
):
54-
rows=filtered_response["result"]["data_array"]
55-
filtered_rows= [rowforrowinrowsiffilter_func(row)]
56-
filtered_response["result"]["data_array"]=filtered_rows
57-
58-
# Update row count if present
59-
if"row_count"infiltered_response["result"]:
60-
filtered_response["result"]["row_count"]=len(filtered_rows)
61-
62-
# Create a new result set with the filtered data
52+
# Get all remaining rows
53+
original_index=result_set.results.cur_row_index
54+
result_set.results.cur_row_index=0# Reset to beginning
55+
all_rows=result_set.results.remaining_rows()
56+
57+
# Filter rows
58+
filtered_rows= [rowforrowinall_rowsiffilter_func(row)]
59+
60+
# Import SeaResultSet here to avoid circular imports
61+
fromdatabricks.sql.result_setimportSeaResultSet
62+
63+
# Reuse the command_id from the original result set
64+
command_id=result_set.command_id
65+
66+
# Create an ExecuteResponse with the filtered data
67+
execute_response=ExecuteResponse(
68+
command_id=command_id,
69+
status=result_set.status,
70+
description=result_set.description,
71+
has_more_rows=result_set._has_more_rows,
72+
results_queue=JsonQueue(filtered_rows),
73+
has_been_closed_server_side=result_set.has_been_closed_server_side,
74+
lz4_compressed=False,
75+
is_staging_operation=False,
76+
)
77+
6378
returnSeaResultSet(
6479
connection=result_set.connection,
65-
sea_response=filtered_response,
80+
execute_response=execute_response,
6681
sea_client=result_set.backend,
6782
buffer_size_bytes=result_set.buffer_size_bytes,
6883
arraysize=result_set.arraysize,
@@ -92,6 +107,8 @@ def filter_by_column_values(
92107
allowed_values= [v.upper()forvinallowed_values]
93108

94109
# Determine the type of result set and apply appropriate filtering
110+
fromdatabricks.sql.result_setimportSeaResultSet
111+
95112
ifisinstance(result_set,SeaResultSet):
96113
returnResultSetFilter._filter_sea_result_set(
97114
result_set,
@@ -137,7 +154,7 @@ def filter_tables_by_type(
137154
table_typesiftable_typesandlen(table_types)>0elseDEFAULT_TABLE_TYPES
138155
)
139156

140-
# Table type is typically in the 6th column (index 5)
157+
# Table type is the 6th column (index 5)
141158
returnResultSetFilter.filter_by_column_values(
142159
result_set,5,valid_types,case_sensitive=False
143160
)

‎src/databricks/sql/backend/sea/models/base.py‎

Lines changed: 11 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -34,6 +34,12 @@ class ExternalLink:
3434
external_link:str
3535
expiration:str
3636
chunk_index:int
37+
byte_count:int=0
38+
row_count:int=0
39+
row_offset:int=0
40+
next_chunk_index:Optional[int]=None
41+
next_chunk_internal_link:Optional[str]=None
42+
http_headers:Optional[Dict[str,str]]=None
3743

3844

3945
@dataclass
@@ -61,8 +67,11 @@ class ColumnInfo:
6167
classResultManifest:
6268
"""Manifest information for a result set."""
6369

64-
schema:List[ColumnInfo]
70+
format:str
71+
schema:Dict[str,Any]# Will contain column information
6572
total_row_count:int
6673
total_byte_count:int
74+
total_chunk_count:int
6775
truncated:bool=False
68-
chunk_count:Optional[int]=None
76+
chunks:Optional[List[Dict[str,Any]]]=None
77+
result_compression:Optional[str]=None

‎src/databricks/sql/backend/sea/models/requests.py‎

Lines changed: 4 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -21,18 +21,16 @@ class StatementParameter:
2121
classExecuteStatementRequest:
2222
"""Request to execute a SQL statement."""
2323

24-
warehouse_id:str
25-
statement:str
2624
session_id:str
25+
statement:str
26+
warehouse_id:str
2727
disposition:str="EXTERNAL_LINKS"
2828
format:str="JSON_ARRAY"
29+
result_compression:Optional[str]=None
30+
parameters:Optional[List[StatementParameter]]=None
2931
wait_timeout:str="10s"
3032
on_wait_timeout:str="CONTINUE"
3133
row_limit:Optional[int]=None
32-
parameters:Optional[List[StatementParameter]]=None
33-
catalog:Optional[str]=None
34-
schema:Optional[str]=None
35-
result_compression:Optional[str]=None
3634

3735
defto_dict(self)->Dict[str,Any]:
3836
"""Convert the request to a dictionary for JSON serialization."""
@@ -49,12 +47,6 @@ def to_dict(self) -> Dict[str, Any]:
4947
ifself.row_limitisnotNoneandself.row_limit>0:
5048
result["row_limit"]=self.row_limit
5149

52-
ifself.catalog:
53-
result["catalog"]=self.catalog
54-
55-
ifself.schema:
56-
result["schema"]=self.schema
57-
5850
ifself.result_compression:
5951
result["result_compression"]=self.result_compression
6052

‎src/databricks/sql/backend/sea/models/responses.py‎

Lines changed: 133 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -13,6 +13,8 @@
1313
ResultManifest,
1414
ResultData,
1515
ServiceError,
16+
ExternalLink,
17+
ColumnInfo,
1618
)
1719

1820

@@ -37,20 +39,62 @@ def from_dict(cls, data: Dict[str, Any]) -> "ExecuteStatementResponse":
3739
error_code=error_data.get("error_code"),
3840
)
3941

40-
state=CommandState.from_sea_state(status_data.get("state",""))
41-
ifstateisNone:
42-
raiseValueError(f"Invalid state:{status_data.get('state','')}")
4342
status=StatementStatus(
44-
state=state,
43+
state=CommandState.from_sea_state(status_data.get("state","")),
4544
error=error,
4645
sql_state=status_data.get("sql_state"),
4746
)
4847

48+
# Parse manifest
49+
manifest=None
50+
if"manifest"indata:
51+
manifest_data=data["manifest"]
52+
manifest=ResultManifest(
53+
format=manifest_data.get("format",""),
54+
schema=manifest_data.get("schema", {}),
55+
total_row_count=manifest_data.get("total_row_count",0),
56+
total_byte_count=manifest_data.get("total_byte_count",0),
57+
total_chunk_count=manifest_data.get("total_chunk_count",0),
58+
truncated=manifest_data.get("truncated",False),
59+
chunks=manifest_data.get("chunks"),
60+
result_compression=manifest_data.get("result_compression"),
61+
)
62+
63+
# Parse result data
64+
result=None
65+
if"result"indata:
66+
result_data=data["result"]
67+
external_links=None
68+
69+
if"external_links"inresult_data:
70+
external_links= []
71+
forlink_datainresult_data["external_links"]:
72+
external_links.append(
73+
ExternalLink(
74+
external_link=link_data.get("external_link",""),
75+
expiration=link_data.get("expiration",""),
76+
chunk_index=link_data.get("chunk_index",0),
77+
byte_count=link_data.get("byte_count",0),
78+
row_count=link_data.get("row_count",0),
79+
row_offset=link_data.get("row_offset",0),
80+
next_chunk_index=link_data.get("next_chunk_index"),
81+
next_chunk_internal_link=link_data.get(
82+
"next_chunk_internal_link"
83+
),
84+
http_headers=link_data.get("http_headers"),
85+
)
86+
)
87+
88+
result=ResultData(
89+
data=result_data.get("data_array"),
90+
external_links=external_links,
91+
)
92+
4993
returncls(
5094
statement_id=data.get("statement_id",""),
5195
status=status,
52-
manifest=data.get("manifest"),# We'll parse this more fully if needed
53-
result=data.get("result"),# We'll parse this more fully if needed
96+
manifest=manifest,
97+
result=result,
5498
)
5599

56100

@@ -75,21 +119,62 @@ def from_dict(cls, data: Dict[str, Any]) -> "GetStatementResponse":
75119
error_code=error_data.get("error_code"),
76120
)
77121

78-
state=CommandState.from_sea_state(status_data.get("state",""))
79-
ifstateisNone:
80-
raiseValueError(f"Invalid state:{status_data.get('state','')}")
81-
82122
status=StatementStatus(
83-
state=state,
123+
state=CommandState.from_sea_state(status_data.get("state","")),
84124
error=error,
85125
sql_state=status_data.get("sql_state"),
86126
)
87127

128+
# Parse manifest
129+
manifest=None
130+
if"manifest"indata:
131+
manifest_data=data["manifest"]
132+
manifest=ResultManifest(
133+
format=manifest_data.get("format",""),
134+
schema=manifest_data.get("schema", {}),
135+
total_row_count=manifest_data.get("total_row_count",0),
136+
total_byte_count=manifest_data.get("total_byte_count",0),
137+
total_chunk_count=manifest_data.get("total_chunk_count",0),
138+
truncated=manifest_data.get("truncated",False),
139+
chunks=manifest_data.get("chunks"),
140+
result_compression=manifest_data.get("result_compression"),
141+
)
142+
143+
# Parse result data
144+
result=None
145+
if"result"indata:
146+
result_data=data["result"]
147+
external_links=None
148+
149+
if"external_links"inresult_data:
150+
external_links= []
151+
forlink_datainresult_data["external_links"]:
152+
external_links.append(
153+
ExternalLink(
154+
external_link=link_data.get("external_link",""),
155+
expiration=link_data.get("expiration",""),
156+
chunk_index=link_data.get("chunk_index",0),
157+
byte_count=link_data.get("byte_count",0),
158+
row_count=link_data.get("row_count",0),
159+
row_offset=link_data.get("row_offset",0),
160+
next_chunk_index=link_data.get("next_chunk_index"),
161+
next_chunk_internal_link=link_data.get(
162+
"next_chunk_internal_link"
163+
),
164+
http_headers=link_data.get("http_headers"),
165+
)
166+
)
167+
168+
result=ResultData(
169+
data=result_data.get("data_array"),
170+
external_links=external_links,
171+
)
172+
88173
returncls(
89174
statement_id=data.get("statement_id",""),
90175
status=status,
91-
manifest=data.get("manifest"),# We'll parse this more fully if needed
92-
result=data.get("result"),# We'll parse this more fully if needed
176+
manifest=manifest,
177+
result=result,
93178
)
94179

95180

@@ -103,3 +188,38 @@ class CreateSessionResponse:
103188
deffrom_dict(cls,data:Dict[str,Any])->"CreateSessionResponse":
104189
"""Create a CreateSessionResponse from a dictionary."""
105190
returncls(session_id=data.get("session_id",""))
191+
192+
193+
@dataclass
194+
classGetChunksResponse:
195+
"""Response from getting chunks for a statement."""
196+
197+
statement_id:str
198+
external_links:List[ExternalLink]
199+
200+
@classmethod
201+
deffrom_dict(cls,data:Dict[str,Any])->"GetChunksResponse":
202+
"""Create a GetChunksResponse from a dictionary."""
203+
external_links= []
204+
if"external_links"indata:
205+
forlink_dataindata["external_links"]:
206+
external_links.append(
207+
ExternalLink(
208+
external_link=link_data.get("external_link",""),
209+
expiration=link_data.get("expiration",""),
210+
chunk_index=link_data.get("chunk_index",0),
211+
byte_count=link_data.get("byte_count",0),
212+
row_count=link_data.get("row_count",0),
213+
row_offset=link_data.get("row_offset",0),
214+
next_chunk_index=link_data.get("next_chunk_index"),
215+
next_chunk_internal_link=link_data.get(
216+
"next_chunk_internal_link"
217+
),
218+
http_headers=link_data.get("http_headers"),
219+
)
220+
)
221+
222+
returncls(
223+
statement_id=data.get("statement_id",""),
224+
external_links=external_links,
225+
)

0 commit comments

Comments
 (0)

[8]ページ先頭

©2009-2025 Movatter.jp