mirror of
https://github.com/PostHog/posthog.git
synced 2024-11-24 00:47:50 +01:00
fix(data-warehouse): Fix for missing table_format on dlt resources (#24411)
This commit is contained in:
parent
22e689c8f3
commit
dee5ca103c
@ -21,6 +21,7 @@ from posthog.warehouse.data_load.validate_schema import validate_schema_and_upda
|
|||||||
from posthog.warehouse.models.external_data_job import ExternalDataJob, get_external_data_job
|
from posthog.warehouse.models.external_data_job import ExternalDataJob, get_external_data_job
|
||||||
from posthog.warehouse.models.external_data_schema import ExternalDataSchema, aget_schema_by_id
|
from posthog.warehouse.models.external_data_schema import ExternalDataSchema, aget_schema_by_id
|
||||||
from posthog.warehouse.models.external_data_source import ExternalDataSource
|
from posthog.warehouse.models.external_data_source import ExternalDataSource
|
||||||
|
from posthog.warehouse.models.table import DataWarehouseTable
|
||||||
from posthog.warehouse.s3 import get_s3_client
|
from posthog.warehouse.s3 import get_s3_client
|
||||||
|
|
||||||
|
|
||||||
@ -160,6 +161,12 @@ class DataImportPipeline:
|
|||||||
if total_counts.total() > 0:
|
if total_counts.total() > 0:
|
||||||
delta_tables = get_delta_tables(pipeline)
|
delta_tables = get_delta_tables(pipeline)
|
||||||
|
|
||||||
|
table_format = DataWarehouseTable.TableFormat.DeltaS3Wrapper
|
||||||
|
|
||||||
|
# Workaround while we fix missing table_format on DLT resource
|
||||||
|
if len(delta_tables.values()) == 0:
|
||||||
|
table_format = DataWarehouseTable.TableFormat.Delta
|
||||||
|
|
||||||
# There should only ever be one table here
|
# There should only ever be one table here
|
||||||
for table in delta_tables.values():
|
for table in delta_tables.values():
|
||||||
table.optimize.compact()
|
table.optimize.compact()
|
||||||
@ -174,6 +181,7 @@ class DataImportPipeline:
|
|||||||
schema_id=self.inputs.schema_id,
|
schema_id=self.inputs.schema_id,
|
||||||
table_schema=self.source.schema.tables,
|
table_schema=self.source.schema.tables,
|
||||||
row_count=total_counts.total(),
|
row_count=total_counts.total(),
|
||||||
|
table_format=table_format,
|
||||||
)
|
)
|
||||||
|
|
||||||
pipeline_runs = pipeline_runs + 1
|
pipeline_runs = pipeline_runs + 1
|
||||||
@ -208,6 +216,12 @@ class DataImportPipeline:
|
|||||||
if total_counts.total() > 0:
|
if total_counts.total() > 0:
|
||||||
delta_tables = get_delta_tables(pipeline)
|
delta_tables = get_delta_tables(pipeline)
|
||||||
|
|
||||||
|
table_format = DataWarehouseTable.TableFormat.DeltaS3Wrapper
|
||||||
|
|
||||||
|
# Workaround while we fix missing table_format on DLT resource
|
||||||
|
if len(delta_tables.values()) == 0:
|
||||||
|
table_format = DataWarehouseTable.TableFormat.Delta
|
||||||
|
|
||||||
# There should only ever be one table here
|
# There should only ever be one table here
|
||||||
for table in delta_tables.values():
|
for table in delta_tables.values():
|
||||||
table.optimize.compact()
|
table.optimize.compact()
|
||||||
@ -222,6 +236,7 @@ class DataImportPipeline:
|
|||||||
schema_id=self.inputs.schema_id,
|
schema_id=self.inputs.schema_id,
|
||||||
table_schema=self.source.schema.tables,
|
table_schema=self.source.schema.tables,
|
||||||
row_count=total_counts.total(),
|
row_count=total_counts.total(),
|
||||||
|
table_format=table_format,
|
||||||
)
|
)
|
||||||
|
|
||||||
# Delete local state from the file system
|
# Delete local state from the file system
|
||||||
|
@ -72,6 +72,7 @@ async def validate_schema_and_update_table(
|
|||||||
schema_id: uuid.UUID,
|
schema_id: uuid.UUID,
|
||||||
table_schema: TSchemaTables,
|
table_schema: TSchemaTables,
|
||||||
row_count: int,
|
row_count: int,
|
||||||
|
table_format: DataWarehouseTable.TableFormat,
|
||||||
) -> None:
|
) -> None:
|
||||||
"""
|
"""
|
||||||
|
|
||||||
@ -117,7 +118,7 @@ async def validate_schema_and_update_table(
|
|||||||
table_params = {
|
table_params = {
|
||||||
"credential": credential,
|
"credential": credential,
|
||||||
"name": table_name,
|
"name": table_name,
|
||||||
"format": DataWarehouseTable.TableFormat.DeltaS3Wrapper,
|
"format": table_format,
|
||||||
"url_pattern": new_url_pattern,
|
"url_pattern": new_url_pattern,
|
||||||
"team_id": team_id,
|
"team_id": team_id,
|
||||||
"row_count": row_count,
|
"row_count": row_count,
|
||||||
|
Loading…
Reference in New Issue
Block a user