-
Notifications
You must be signed in to change notification settings - Fork 4.4k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
fix postgres data handling from WAL logs in CDC mode (#15481)
* fix postgres data handling from WAL logs in CDC mode * format * use formatter for dates also (#15485) * format * change test structure * change log to debug Co-authored-by: Edward Gao <edward.gao@airbyte.io>
- Loading branch information
1 parent
fdb5eb9
commit 0092712
Showing
13 changed files
with
387 additions
and
169 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
131 changes: 131 additions & 0 deletions
131
airbyte-db/db-lib/src/main/java/io/airbyte/db/jdbc/DateTimeConverter.java
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,131 @@ | ||
/* | ||
* Copyright (c) 2022 Airbyte, Inc., all rights reserved. | ||
*/ | ||
|
||
package io.airbyte.db.jdbc; | ||
|
||
import static io.airbyte.db.DataTypeUtils.DATE_FORMATTER; | ||
import static io.airbyte.db.DataTypeUtils.TIMESTAMPTZ_FORMATTER; | ||
import static io.airbyte.db.DataTypeUtils.TIMESTAMP_FORMATTER; | ||
import static io.airbyte.db.DataTypeUtils.TIMETZ_FORMATTER; | ||
import static io.airbyte.db.DataTypeUtils.TIME_FORMATTER; | ||
import static io.airbyte.db.jdbc.AbstractJdbcCompatibleSourceOperations.resolveEra; | ||
import static java.time.ZoneOffset.UTC; | ||
|
||
import java.sql.Date; | ||
import java.sql.Time; | ||
import java.sql.Timestamp; | ||
import java.time.Duration; | ||
import java.time.Instant; | ||
import java.time.LocalDate; | ||
import java.time.LocalDateTime; | ||
import java.time.LocalTime; | ||
import java.time.OffsetDateTime; | ||
import java.time.OffsetTime; | ||
import java.time.ZonedDateTime; | ||
import java.time.format.DateTimeFormatter; | ||
import java.util.concurrent.TimeUnit; | ||
import org.slf4j.Logger; | ||
import org.slf4j.LoggerFactory; | ||
|
||
public class DateTimeConverter { | ||
|
||
private static final Logger LOGGER = LoggerFactory.getLogger(DateTimeConverter.class); | ||
public static final DateTimeFormatter TIME_WITH_TIMEZONE_FORMATTER = DateTimeFormatter.ofPattern( | ||
"HH:mm:ss[.][SSSSSSSSS][SSSSSSS][SSSSSS][SSSSS][SSSS][SSS][SS][S][''][XXX][XX][X]"); | ||
|
||
public static String convertToTimeWithTimezone(final Object time) { | ||
if (time instanceof final java.time.OffsetTime timetz) { | ||
return timetz.format(TIMETZ_FORMATTER); | ||
} | ||
final OffsetTime timetz = OffsetTime.parse(time.toString(), TIME_WITH_TIMEZONE_FORMATTER); | ||
return timetz.format(TIMETZ_FORMATTER); | ||
} | ||
|
||
public static String convertToTimestampWithTimezone(final Object timestamp) { | ||
if (timestamp instanceof final Timestamp t) { | ||
// In snapshot mode, debezium produces a java.sql.Timestamp object for the TIMESTAMPTZ type. | ||
// Conceptually, a timestamp with timezone is an Instant. But t.toInstant() actually mangles the | ||
// value for ancient dates, because leap years weren't applied consistently in ye olden days. | ||
// Additionally, toInstant() (and toLocalDateTime()) actually lose the era indicator, so we can't | ||
// rely on their getEra() methods. | ||
// So we have special handling for this case, which sidesteps the toInstant conversion. | ||
final ZonedDateTime timestamptz = t.toLocalDateTime().atZone(UTC); | ||
final String value = timestamptz.format(TIMESTAMPTZ_FORMATTER); | ||
return resolveEra(t, value); | ||
} else if (timestamp instanceof final OffsetDateTime t) { | ||
return resolveEra(t.toLocalDate(), t.format(TIMESTAMPTZ_FORMATTER)); | ||
} else if (timestamp instanceof final ZonedDateTime timestamptz) { | ||
return resolveEra(timestamptz.toLocalDate(), timestamptz.format(TIMESTAMPTZ_FORMATTER)); | ||
} else { | ||
// This case probably isn't strictly necessary, but I'm leaving it just in case there's some weird | ||
// situation that I'm not aware of. | ||
final Instant instant = Instant.parse(timestamp.toString()); | ||
final OffsetDateTime offsetDateTime = OffsetDateTime.ofInstant(instant, UTC); | ||
final ZonedDateTime timestamptz = ZonedDateTime.from(offsetDateTime); | ||
final LocalDate localDate = timestamptz.toLocalDate(); | ||
final String value = timestamptz.format(TIMESTAMPTZ_FORMATTER); | ||
return resolveEra(localDate, value); | ||
} | ||
} | ||
|
||
/** | ||
* See {@link #convertToTimestampWithTimezone(Object)} for explanation of the weird things happening | ||
* here. | ||
*/ | ||
public static String convertToTimestamp(final Object timestamp) { | ||
if (timestamp instanceof final Timestamp t) { | ||
// Snapshot mode | ||
final LocalDateTime localDateTime = t.toLocalDateTime(); | ||
final String value = localDateTime.format(TIMESTAMP_FORMATTER); | ||
return resolveEra(t, value); | ||
} else if (timestamp instanceof final Instant i) { | ||
// Incremental mode | ||
return resolveEra(i.atZone(UTC).toLocalDate(), i.atOffset(UTC).toLocalDateTime().format(TIMESTAMP_FORMATTER)); | ||
} else { | ||
final LocalDateTime localDateTime = LocalDateTime.parse(timestamp.toString()); | ||
final LocalDate date = localDateTime.toLocalDate(); | ||
final String value = localDateTime.format(TIMESTAMP_FORMATTER); | ||
return resolveEra(date, value); | ||
} | ||
} | ||
|
||
/** | ||
* See {@link #convertToTimestampWithTimezone(Object)} for explanation of the weird things happening | ||
* here. | ||
*/ | ||
public static String convertToDate(final Object date) { | ||
if (date instanceof final Date d) { | ||
// Snapshot mode | ||
final LocalDate localDate = ((Date) date).toLocalDate(); | ||
return resolveEra(d, localDate.format(DATE_FORMATTER)); | ||
} else if (date instanceof LocalDate d) { | ||
// Incremental mode | ||
return resolveEra(d, d.format(DATE_FORMATTER)); | ||
} else { | ||
final LocalDate localDate = LocalDate.parse(date.toString()); | ||
return resolveEra(localDate, localDate.format(DATE_FORMATTER)); | ||
} | ||
} | ||
|
||
public static String convertToTime(final Object time) { | ||
if (time instanceof final Time sqlTime) { | ||
return sqlTime.toLocalTime().format(TIME_FORMATTER); | ||
} else if (time instanceof final LocalTime localTime) { | ||
return localTime.format(TIME_FORMATTER); | ||
} else if (time instanceof java.time.Duration) { | ||
long value = ((Duration) time).toNanos(); | ||
if (value >= 0 && value <= TimeUnit.DAYS.toNanos(1)) { | ||
return LocalTime.ofNanoOfDay(value).format(TIME_FORMATTER); | ||
} else { | ||
final long updatedValue = 0 > value ? Math.abs(value) : TimeUnit.DAYS.toNanos(1); | ||
LOGGER.debug("Time values must use number of milliseconds greater than 0 and less than 86400000000000 but its {}, converting to {} ", value, | ||
updatedValue); | ||
return LocalTime.ofNanoOfDay(updatedValue).format(TIME_FORMATTER); | ||
} | ||
} else { | ||
return LocalTime.parse(time.toString()).format(TIME_FORMATTER); | ||
} | ||
} | ||
|
||
} |
122 changes: 0 additions & 122 deletions
122
...um-v1-9-2/src/main/java/io/airbyte/integrations/debezium/internals/DateTimeConverter.java
This file was deleted.
Oops, something went wrong.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.