Skip to content

Commit

Permalink
[CALCITE-6210] Cast to VARBINARY causes an assertion failure
Browse files Browse the repository at this point in the history
Signed-off-by: Mihai Budiu <mbudiu@feldera.com>
  • Loading branch information
mihaibudiu committed Apr 10, 2024
1 parent 889f416 commit aba64f0
Show file tree
Hide file tree
Showing 10 changed files with 67 additions and 16 deletions.
4 changes: 2 additions & 2 deletions babel/src/test/resources/sql/redshift.iq
Original file line number Diff line number Diff line change
Expand Up @@ -1777,7 +1777,7 @@ SELECT "LENGTH"('ily')

-- returns 8 (cf OCTET_LENGTH)
select length('français');
SELECT "LENGTH"(u&'fran\00e7ais')
SELECT "LENGTH"('français')
!explain-validated-on calcite

# LOWER
Expand Down Expand Up @@ -1824,7 +1824,7 @@ f7415e33f972c03abd4f3fed36748f7a
# OCTET_LENGTH
-- returns 9 (cf LENGTH)
select octet_length('français');
SELECT OCTET_LENGTH(CAST(u&'fran\00e7ais' AS VARBINARY))
SELECT OCTET_LENGTH(CAST('français' AS VARBINARY))
!explain-validated-on calcite

# POSITION is a synonym for STRPOS
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -80,6 +80,7 @@
import java.lang.reflect.Modifier;
import java.lang.reflect.Type;
import java.math.BigDecimal;
import java.nio.charset.Charset;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
Expand Down Expand Up @@ -308,6 +309,18 @@ private Expression getConvertExpression(
case ANY:
return operand;

case VARBINARY:
case BINARY:
switch (sourceType.getSqlTypeName()) {
case CHAR:
case VARCHAR:
return Expressions.call(BuiltInMethod.STRING_TO_BINARY.method, operand,
new ConstantExpression(Charset.class, sourceType.getCharset()));

default:
return defaultExpression.get();
}

case GEOMETRY:
switch (sourceType.getSqlTypeName()) {
case CHAR:
Expand Down
3 changes: 2 additions & 1 deletion core/src/main/java/org/apache/calcite/rex/RexUtil.java
Original file line number Diff line number Diff line change
Expand Up @@ -1683,7 +1683,8 @@ public static boolean isLosslessCast(RexNode node) {
*
* @param source source type
* @param target target type
* @return true iff the conversion is a loss-less cast
* @return 'true' when the conversion can certainly be determined to be loss-less cast,
* but may return 'false' for some lossless casts.
*/
@API(since = "1.22", status = API.Status.EXPERIMENTAL)
public static boolean isLosslessCast(RelDataType source, RelDataType target) {
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -4575,6 +4575,14 @@ public static int time(long timestampMillis, String timeZone) {
}
}

public static @PolyNull ByteString stringToBinary(@PolyNull String s, Charset charset) {
if (s == null) {
return null;
} else {
return new ByteString(s.getBytes(charset));
}
}

/** Helper for CAST(... AS VARBINARY(maxLength)). */
public static @PolyNull ByteString truncate(@PolyNull ByteString s, int maxLength) {
if (s == null) {
Expand Down
16 changes: 6 additions & 10 deletions core/src/main/java/org/apache/calcite/sql/SqlDialect.java
Original file line number Diff line number Diff line change
Expand Up @@ -433,17 +433,13 @@ public final String quoteStringLiteral(String val) {
*/
public void quoteStringLiteral(StringBuilder buf, @Nullable String charsetName,
String val) {
if (containsNonAscii(val) && charsetName == null) {
quoteStringLiteralUnicode(buf, val);
} else {
if (charsetName != null) {
buf.append("_");
buf.append(charsetName);
}
buf.append(literalQuoteString);
buf.append(val.replace(literalEndQuoteString, literalEscapedQuote));
buf.append(literalEndQuoteString);
if (charsetName != null) {
buf.append("_");
buf.append(charsetName);
}
buf.append(literalQuoteString);
buf.append(val.replace(literalEndQuoteString, literalEscapedQuote));
buf.append(literalEndQuoteString);
}

public void unparseCall(SqlWriter writer, SqlCall call, int leftPrec,
Expand Down
2 changes: 2 additions & 0 deletions core/src/main/java/org/apache/calcite/util/BuiltInMethod.java
Original file line number Diff line number Diff line change
Expand Up @@ -124,6 +124,7 @@
import java.lang.reflect.Field;
import java.lang.reflect.Method;
import java.math.BigDecimal;
import java.nio.charset.Charset;
import java.sql.ResultSet;
import java.sql.Time;
import java.sql.Timestamp;
Expand Down Expand Up @@ -604,6 +605,7 @@ public enum BuiltInMethod {
String.class, TimeZone.class),
STRING_TO_TIMESTAMP_WITH_LOCAL_TIME_ZONE(SqlFunctions.class, "toTimestampWithLocalTimeZone",
String.class),
STRING_TO_BINARY(SqlFunctions.class, "stringToBinary", String.class, Charset.class),
TIMESTAMP_STRING_TO_TIMESTAMP_WITH_LOCAL_TIME_ZONE(SqlFunctions.class,
"toTimestampWithLocalTimeZone", String.class, TimeZone.class),
TIME_WITH_LOCAL_TIME_ZONE_TO_TIME(SqlFunctions.class, "timeWithLocalTimeZoneToTime",
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -7020,7 +7020,7 @@ private void checkLiteral2(String expression, String expected) {
final String expected0 = "SELECT JSON_INSERT(\"product_name\", '$', 10)\n"
+ "FROM \"foodmart\".\"product\"";
final String expected1 = "SELECT JSON_INSERT(NULL, '$', 10, '$', NULL, '$', "
+ "u&'\\000a\\0009\\000a')\nFROM \"foodmart\".\"product\"";
+ "'\n\t\n')\nFROM \"foodmart\".\"product\"";
sql(query0).ok(expected0);
sql(query1).ok(expected1);
}
Expand All @@ -7032,7 +7032,7 @@ private void checkLiteral2(String expression, String expected) {
final String expected = "SELECT JSON_REPLACE(\"product_name\", '$', 10)\n"
+ "FROM \"foodmart\".\"product\"";
final String expected1 = "SELECT JSON_REPLACE(NULL, '$', 10, '$', NULL, '$', "
+ "u&'\\000a\\0009\\000a')\nFROM \"foodmart\".\"product\"";
+ "'\n\t\n')\nFROM \"foodmart\".\"product\"";
sql(query).ok(expected);
sql(query1).ok(expected1);
}
Expand All @@ -7044,7 +7044,7 @@ private void checkLiteral2(String expression, String expected) {
final String expected = "SELECT JSON_SET(\"product_name\", '$', 10)\n"
+ "FROM \"foodmart\".\"product\"";
final String expected1 = "SELECT JSON_SET(NULL, '$', 10, '$', NULL, '$', "
+ "u&'\\000a\\0009\\000a')\nFROM \"foodmart\".\"product\"";
+ "'\n\t\n')\nFROM \"foodmart\".\"product\"";
sql(query).ok(expected);
sql(query1).ok(expected1);
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -23,6 +23,7 @@
import java.lang.reflect.Type;
import java.math.BigDecimal;
import java.math.BigInteger;
import java.nio.charset.Charset;
import java.util.Arrays;
import java.util.List;
import java.util.Map;
Expand Down Expand Up @@ -208,6 +209,12 @@ private static ExpressionWriter write(ExpressionWriter writer,
if (value instanceof Set) {
return writeSet(writer, (Set) value);
}
if (value instanceof Charset) {
writer.append("java.nio.charset.Charset.forName(\"");
writer.append(value);
writer.append("\")");
return writer;
}

Constructor constructor = matchingConstructor(value);
if (constructor != null) {
Expand Down
5 changes: 5 additions & 0 deletions site/_docs/reference.md
Original file line number Diff line number Diff line change
Expand Up @@ -1478,6 +1478,11 @@ Algorithms for implicit conversion are subject to change across Calcite releases
| CONVERT(value USING transcodingName) | Alter *value* from one base character set to *transcodingName*
| TRANSLATE(value USING transcodingName) | Alter *value* from one base character set to *transcodingName*

Converting a string to a **BINARY** or **VARBINARY** type produces the
list of bytes of the string's encoding in the strings' charset. A
runtime error is produced if the string's characters cannot be
represented using its charset.

Supported data types syntax:

{% highlight sql %}
Expand Down
19 changes: 19 additions & 0 deletions testkit/src/main/java/org/apache/calcite/test/SqlOperatorTest.java
Original file line number Diff line number Diff line change
Expand Up @@ -707,6 +707,25 @@ void testCastToExactNumeric(CastType castType, SqlOperatorFixture f) {
"CHAR(1) NOT NULL", "3");
}

/**
* Test case for <a href="https://issues.apache.org/jira/browse/CALCITE-6210">
* Cast to VARBINARY causes an assertion failure</a>. */
@Test public void testVarbinaryCast() {
SqlOperatorFixture f = fixture();
f.checkScalar("CAST('00' AS VARBINARY)", "3030", "VARBINARY NOT NULL");
f.checkScalar("CAST('help' AS VARBINARY)", "68656c70", "VARBINARY NOT NULL");
f.checkScalar("CAST('help' AS VARBINARY(2))", "6865", "VARBINARY(2) NOT NULL");
f.checkScalar("CAST('00' AS BINARY(1))", "30", "BINARY(1) NOT NULL");
f.checkScalar("CAST('10' AS BINARY(2))", "3130", "BINARY(2) NOT NULL");
f.checkScalar("CAST('10' AS BINARY(1))", "31", "BINARY(1) NOT NULL");
f.checkScalar("CAST('10' AS BINARY(3))", "313000", "BINARY(3) NOT NULL");
f.checkScalar("CAST(_UTF8'Hello ਸੰਸਾਰ!' AS VARBINARY)",
"48656c6c6f20e0a8b8e0a9b0e0a8b8e0a8bee0a8b021", "VARBINARY NOT NULL");
f.checkFails("CAST('Hello ਸੰਸਾਰ!' AS VARBINARY)",
".*Failed to encode .* in character set 'ISO-8859-1'", true);
f.checkNull("CAST(CAST(NULL AS VARCHAR) AS VARBINARY)");
}

@ParameterizedTest
@MethodSource("safeParameters")
void testCastStringToDecimal(CastType castType, SqlOperatorFixture f) {
Expand Down

0 comments on commit aba64f0

Please sign in to comment.