From a14140be104281c8e4181a1a20dcea6691087189 Mon Sep 17 00:00:00 2001 From: Pawel Leszczynski Date: Thu, 1 Dec 2022 08:56:55 +0100 Subject: [PATCH] allow nullable column type in column-lineaeg Signed-off-by: Pawel Leszczynski --- CHANGELOG.md | 6 ++++++ .../marquez/db/mappers/ColumnLineageNodeDataMapper.java | 2 +- .../java/marquez/db/models/ColumnLineageNodeData.java | 2 +- api/src/test/java/marquez/db/ColumnLineageDaoTest.java | 9 +++++++++ 4 files changed, 17 insertions(+), 2 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 613a070524..f0da110030 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,9 +1,15 @@ # Changelog ## [Unreleased](https://github.com/MarquezProject/marquez/compare/0.28.0...HEAD) + +### Added + * Column-lineage endpoints supports point-in-time requests [`#2265`](https://github.com/MarquezProject/marquez/pull/2265) [@pawel-big-lebowski](https://github.com/pawel-big-lebowski) *Enable requesting `column-lineage` endpoint by a dataset version, job version or dataset field of a specific dataset version.* +### Fixed + +* Allow null column type in column-lineage [`#2272`](https://github.com/MarquezProject/marquez/pull/2272) [@pawel-big-lebowski](https://github.com/pawel-big-lebowski) * Include error message for JSON processing exception [`#2271`](https://github.com/MarquezProject/marquez/pull/2271) [@pawel-big-lebowski](https://github.com/pawel-big-lebowski) *In case of JSON processing exceptions Marquez API should return exception message to a client.* diff --git a/api/src/main/java/marquez/db/mappers/ColumnLineageNodeDataMapper.java b/api/src/main/java/marquez/db/mappers/ColumnLineageNodeDataMapper.java index cc24e74f76..0c7ef15b32 100644 --- a/api/src/main/java/marquez/db/mappers/ColumnLineageNodeDataMapper.java +++ b/api/src/main/java/marquez/db/mappers/ColumnLineageNodeDataMapper.java @@ -39,7 +39,7 @@ public ColumnLineageNodeData map(ResultSet results, StatementContext ctx) throws stringOrThrow(results, Columns.DATASET_NAME), uuidOrThrow(results, Columns.DATASET_VERSION_UUID), stringOrThrow(results, Columns.FIELD_NAME), - stringOrThrow(results, Columns.TYPE), + stringOrNull(results, Columns.TYPE), stringOrNull(results, TRANSFORMATION_DESCRIPTION), stringOrNull(results, TRANSFORMATION_TYPE), toInputFields(results, "inputFields")); diff --git a/api/src/main/java/marquez/db/models/ColumnLineageNodeData.java b/api/src/main/java/marquez/db/models/ColumnLineageNodeData.java index 43f3137cbe..88431bb48f 100644 --- a/api/src/main/java/marquez/db/models/ColumnLineageNodeData.java +++ b/api/src/main/java/marquez/db/models/ColumnLineageNodeData.java @@ -19,7 +19,7 @@ public class ColumnLineageNodeData implements NodeData { @NonNull String dataset; @Nullable UUID datasetVersion; @NonNull String field; - @NonNull String fieldType; + @Nullable String fieldType; String transformationDescription; String transformationType; @NonNull List inputFields; diff --git a/api/src/test/java/marquez/db/ColumnLineageDaoTest.java b/api/src/test/java/marquez/db/ColumnLineageDaoTest.java index c84ec5bb14..e0571f3562 100644 --- a/api/src/test/java/marquez/db/ColumnLineageDaoTest.java +++ b/api/src/test/java/marquez/db/ColumnLineageDaoTest.java @@ -474,6 +474,15 @@ void testGetLineageWhenJobRunMultipleTimes() { .isEqualTo(lineageRow.getInputs().get().get(0).getDatasetVersionRow().getUuid()); } + @Test + void testGetLineageWhenDataTypeIsEmpty() { + Dataset datasetWithNullDataType = getDatasetB(); + datasetWithNullDataType.getFacets().getSchema().getFields().get(0).setType(null); + + UpdateLineageRow lineageRow = createLineage(openLineageDao, dataset_A, datasetWithNullDataType); + getColumnLineage(lineageRow, "col_c"); + } + private Set getColumnLineage(UpdateLineageRow lineageRow, String field) { UpdateLineageRow.DatasetRecord datasetRecord = lineageRow.getOutputs().get().get(0); UUID field_UUID = fieldDao.findUuid(datasetRecord.getDatasetRow().getUuid(), field).get();