Skip to content

[Compiler plugin] Propagate nullability in toDataFrame tree conversion #942

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Merged
merged 2 commits into from
Nov 8, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -25,9 +25,12 @@ import org.jetbrains.kotlin.fir.symbols.SymbolInternals
import org.jetbrains.kotlin.fir.symbols.impl.ConeClassLikeLookupTagImpl
import org.jetbrains.kotlin.fir.symbols.impl.FirPropertySymbol
import org.jetbrains.kotlin.fir.types.ConeClassLikeType
import org.jetbrains.kotlin.fir.types.ConeFlexibleType
import org.jetbrains.kotlin.fir.types.ConeKotlinType
import org.jetbrains.kotlin.fir.types.ConeNullability
import org.jetbrains.kotlin.fir.types.ConeStarProjection
import org.jetbrains.kotlin.fir.types.ConeTypeParameterType
import org.jetbrains.kotlin.fir.types.ConeTypeProjection
import org.jetbrains.kotlin.fir.types.canBeNull
import org.jetbrains.kotlin.fir.types.classId
import org.jetbrains.kotlin.fir.types.coneType
Expand All @@ -41,15 +44,18 @@ import org.jetbrains.kotlin.fir.types.resolvedType
import org.jetbrains.kotlin.fir.types.toRegularClassSymbol
import org.jetbrains.kotlin.fir.types.toSymbol
import org.jetbrains.kotlin.fir.types.type
import org.jetbrains.kotlin.fir.types.typeContext
import org.jetbrains.kotlin.fir.types.upperBoundIfFlexible
import org.jetbrains.kotlin.fir.types.withArguments
import org.jetbrains.kotlin.fir.types.withNullability
import org.jetbrains.kotlin.name.ClassId
import org.jetbrains.kotlin.name.FqName
import org.jetbrains.kotlin.name.Name
import org.jetbrains.kotlin.name.StandardClassIds
import org.jetbrains.kotlin.name.StandardClassIds.List
import org.jetbrains.kotlinx.dataframe.codeGen.*
import org.jetbrains.kotlinx.dataframe.plugin.extensions.KotlinTypeFacade
import org.jetbrains.kotlinx.dataframe.plugin.extensions.wrap
import org.jetbrains.kotlinx.dataframe.plugin.impl.AbstractInterpreter
import org.jetbrains.kotlinx.dataframe.plugin.impl.AbstractSchemaModificationInterpreter
import org.jetbrains.kotlinx.dataframe.plugin.impl.Arguments
Expand All @@ -71,27 +77,31 @@ import java.util.*
/**
 * Schema interpreter that runs the DSL `body` against a fresh
 * [CreateDataFrameDslImplApproximation] and returns a [PluginDataFrameSchema]
 * built from the columns collected in that object.
 *
 * NOTE(review): this listing looks like a rendered diff without +/- markers. The two
 * consecutive `body(...)` calls are presumably the removed ("explicitReceiver") and the
 * added ("typeArg0") variant of a single statement — confirm against the real file.
 */
class ToDataFrameDsl : AbstractSchemaModificationInterpreter() {
val Arguments.receiver: FirExpression? by arg(lens = Interpreter.Id)
val Arguments.body by dsl()
// Nullable here, unlike the non-null `typeArg0` declared by the sibling interpreters.
val Arguments.typeArg0: ConeTypeProjection? by arg(lens = Interpreter.Id)

override fun Arguments.interpret(): PluginDataFrameSchema {
val dsl = CreateDataFrameDslImplApproximation()
// Passes the call receiver to the DSL body under the "explicitReceiver" key.
body(dsl, mapOf("explicitReceiver" to Interpreter.Success(receiver)))
// Passes the first type argument to the DSL body under the "typeArg0" key.
body(dsl, mapOf("typeArg0" to Interpreter.Success(typeArg0)))
return PluginDataFrameSchema(dsl.columns)
}
}

/**
 * Schema interpreter that delegates to [toDataFrame], using the `maxDepth` argument
 * (which defaults to [DEFAULT_MAX_DEPTH]) and a fresh [TraverseConfiguration].
 *
 * NOTE(review): this listing looks like a rendered diff without +/- markers. The two
 * `return` statements are presumably the removed (receiver-based) and the added
 * (`typeArg0`-based) variant of one line — confirm against the real file.
 */
class ToDataFrame : AbstractSchemaModificationInterpreter() {
val Arguments.receiver: FirExpression? by arg(lens = Interpreter.Id)
val Arguments.maxDepth: Number by arg(defaultValue = Present(DEFAULT_MAX_DEPTH))
val Arguments.typeArg0: ConeTypeProjection by arg(lens = Interpreter.Id)

override fun Arguments.interpret(): PluginDataFrameSchema {
// `maxDepth` is declared as Number, so it is narrowed to Int before the call.
return toDataFrame(maxDepth.toInt(), receiver, TraverseConfiguration())
return toDataFrame(maxDepth.toInt(), typeArg0, TraverseConfiguration())
}
}

/**
 * Schema interpreter that delegates to [toDataFrame] with the fixed depth
 * [DEFAULT_MAX_DEPTH] and a fresh [TraverseConfiguration]; it declares no `maxDepth` argument.
 *
 * NOTE(review): this listing looks like a rendered diff without +/- markers. The two
 * `return` statements are presumably the removed (receiver-based) and the added
 * (`typeArg0`-based) variant of one line — confirm against the real file.
 */
class ToDataFrameDefault : AbstractSchemaModificationInterpreter() {
val Arguments.receiver: FirExpression? by arg(lens = Interpreter.Id)
val Arguments.typeArg0: ConeTypeProjection by arg(lens = Interpreter.Id)

override fun Arguments.interpret(): PluginDataFrameSchema {
return toDataFrame(DEFAULT_MAX_DEPTH, receiver, TraverseConfiguration())
return toDataFrame(DEFAULT_MAX_DEPTH, typeArg0, TraverseConfiguration())
}
}

Expand All @@ -109,14 +119,14 @@ private const val DEFAULT_MAX_DEPTH = 0

/**
 * Interpreter that stores `maxDepth` in the DSL configuration, runs the nested `body`
 * against the DSL's traverse configuration, converts the result with [toDataFrame],
 * and appends the resulting columns to `dsl.columns`. Produces no value (`Unit`).
 *
 * NOTE(review): this listing looks like a rendered diff without +/- markers. The two
 * `val schema = ...` lines are presumably the removed (`explicitReceiver`-based) and the
 * added (`typeArg0`-based) variant of one declaration — confirm against the real file.
 */
class Properties0 : AbstractInterpreter<Unit>() {
val Arguments.dsl: CreateDataFrameDslImplApproximation by arg()
val Arguments.explicitReceiver: FirExpression? by arg()
val Arguments.maxDepth: Int by arg()
val Arguments.body by dsl()
val Arguments.typeArg0: ConeTypeProjection by arg(lens = Interpreter.Id)

override fun Arguments.interpret() {
dsl.configuration.maxDepth = maxDepth
// The nested body runs first, with no additional arguments, so that the traverse
// configuration is filled in before it is handed to toDataFrame below.
body(dsl.configuration.traverseConfiguration, emptyMap())
val schema = toDataFrame(dsl.configuration.maxDepth, explicitReceiver, dsl.configuration.traverseConfiguration)
val schema = toDataFrame(dsl.configuration.maxDepth, typeArg0, dsl.configuration.traverseConfiguration)
dsl.columns.addAll(schema.columns())
}
}
Expand Down Expand Up @@ -172,8 +182,8 @@ class Exclude1 : AbstractInterpreter<Unit>() {
@OptIn(SymbolInternals::class)
internal fun KotlinTypeFacade.toDataFrame(
maxDepth: Int,
explicitReceiver: FirExpression?,
traverseConfiguration: TraverseConfiguration
arg: ConeTypeProjection,
traverseConfiguration: TraverseConfiguration,
): PluginDataFrameSchema {
fun ConeKotlinType.isValueType() =
this.isArrayTypeOrNullableArrayType ||
Expand All @@ -197,7 +207,7 @@ internal fun KotlinTypeFacade.toDataFrame(
val preserveClasses = traverseConfiguration.preserveClasses.mapNotNullTo(mutableSetOf()) { it.classId }
val preserveProperties = traverseConfiguration.preserveProperties.mapNotNullTo(mutableSetOf()) { it.calleeReference.toResolvedPropertySymbol() }

fun convert(classLike: ConeKotlinType, depth: Int): List<SimpleCol> {
fun convert(classLike: ConeKotlinType, depth: Int, makeNullable: Boolean): List<SimpleCol> {
val symbol = classLike.toRegularClassSymbol(session) ?: return emptyList()
val scope = symbol.unsubstitutedScope(session, ScopeSession(), false, FirResolvePhase.STATUS)
val declarations = if (symbol.fir is FirJavaClass) {
Expand Down Expand Up @@ -260,7 +270,7 @@ internal fun KotlinTypeFacade.toDataFrame(

val keepSubtree = depth >= maxDepth && !fieldKind.shouldBeConvertedToColumnGroup && !fieldKind.shouldBeConvertedToFrameColumn
if (keepSubtree || returnType.isValueType() || returnType.classId in preserveClasses || it in preserveProperties) {
SimpleDataColumn(name, TypeApproximation(returnType))
SimpleDataColumn(name, TypeApproximation(returnType.withNullability(ConeNullability.create(makeNullable), session.typeContext)))
} else if (
returnType.isSubtypeOf(StandardClassIds.Iterable.constructClassLikeType(arrayOf(ConeStarProjection)), session) ||
returnType.isSubtypeOf(StandardClassIds.Iterable.constructClassLikeType(arrayOf(ConeStarProjection), isNullable = true), session)
Expand All @@ -271,30 +281,28 @@ internal fun KotlinTypeFacade.toDataFrame(
else -> session.builtinTypes.nullableAnyType.type
}
if (type.isValueType()) {
SimpleDataColumn(name,
TypeApproximation(
List.constructClassLikeType(
arrayOf(type),
returnType.isNullable
)
)
)
val columnType = List.constructClassLikeType(arrayOf(type), returnType.isNullable)
.withNullability(ConeNullability.create(makeNullable), session.typeContext)
.wrap()
SimpleDataColumn(name, columnType)
} else {
SimpleFrameColumn(name, convert(type, depth + 1))
SimpleFrameColumn(name, convert(type, depth + 1, makeNullable = false))
}
} else {
SimpleColumnGroup(name, convert(returnType, depth + 1))
SimpleColumnGroup(name, convert(returnType, depth + 1, returnType.isNullable || makeNullable))
}
}
}

val receiver = explicitReceiver ?: return PluginDataFrameSchema.EMPTY
val arg = receiver.resolvedType.typeArguments.firstOrNull() ?: return PluginDataFrameSchema.EMPTY
return when {
arg.isStarProjection -> PluginDataFrameSchema.EMPTY
else -> {
val classLike = arg.type as? ConeClassLikeType ?: return PluginDataFrameSchema.EMPTY
val columns = convert(classLike, 0)
val classLike = when (val type = arg.type) {
is ConeClassLikeType -> type
is ConeFlexibleType -> type.upperBound
else -> null
} ?: return PluginDataFrameSchema.EMPTY
val columns = convert(classLike, 0, makeNullable = classLike.isNullable)
PluginDataFrameSchema(columns)
}
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -90,29 +90,43 @@ fun <T> KotlinTypeFacade.interpret(
val refinedArguments: RefinedArguments = functionCall.collectArgumentExpressions()

val defaultArguments = processor.expectedArguments.filter { it.defaultValue is Present }.map { it.name }.toSet()
val actualArgsMap = refinedArguments.associateBy { it.name.identifier }.toSortedMap()
val conflictingKeys = additionalArguments.keys intersect actualArgsMap.keys
val actualValueArguments = refinedArguments.associateBy { it.name.identifier }.toSortedMap()
val conflictingKeys = additionalArguments.keys intersect actualValueArguments.keys
if (conflictingKeys.isNotEmpty()) {
if (isTest) {
interpretationFrameworkError("Conflicting keys: $conflictingKeys")
}
return null
}
val expectedArgsMap = processor.expectedArguments
.filterNot { it.name.startsWith("typeArg") }
.associateBy { it.name }.toSortedMap().minus(additionalArguments.keys)

val unexpectedArguments = expectedArgsMap.keys - defaultArguments != actualArgsMap.keys - defaultArguments
val typeArguments = buildMap {
functionCall.typeArguments.forEachIndexed { index, firTypeProjection ->
val key = "typeArg$index"
val lens = expectedArgsMap[key]?.lens ?: return@forEachIndexed
val value: Any = if (lens == Interpreter.Id) {
firTypeProjection.toConeTypeProjection()
} else {
val type = firTypeProjection.toConeTypeProjection().type ?: session.builtinTypes.nullableAnyType.type
if (type is ConeIntersectionType) return@forEachIndexed
Marker(type)
}
put(key, Interpreter.Success(value))
}
}

val unexpectedArguments = (expectedArgsMap.keys - defaultArguments) != (actualValueArguments.keys + typeArguments.keys - defaultArguments)
if (unexpectedArguments) {
if (isTest) {
val message = buildString {
appendLine("ERROR: Different set of arguments")
appendLine("Implementation class: $processor")
appendLine("Not found in actual: ${expectedArgsMap.keys - actualArgsMap.keys}")
val diff = actualArgsMap.keys - expectedArgsMap.keys
appendLine("Not found in actual: ${expectedArgsMap.keys - actualValueArguments.keys}")
val diff = actualValueArguments.keys - expectedArgsMap.keys
appendLine("Passed, but not expected: ${diff}")
appendLine("add arguments to an interpeter:")
appendLine(diff.map { actualArgsMap[it] })
appendLine(diff.map { actualValueArguments[it] })
}
interpretationFrameworkError(message)
}
Expand All @@ -121,6 +135,7 @@ fun <T> KotlinTypeFacade.interpret(

val arguments = mutableMapOf<String, Interpreter.Success<Any?>>()
arguments += additionalArguments
arguments += typeArguments
val interpretationResults = refinedArguments.refinedArguments.mapNotNull {
val name = it.name.identifier
val expectedArgument = expectedArgsMap[name] ?: error("$processor $name")
Expand Down Expand Up @@ -269,17 +284,6 @@ fun <T> KotlinTypeFacade.interpret(
value?.let { value1 -> it.name.identifier to value1 }
}

functionCall.typeArguments.forEachIndexed { index, firTypeProjection ->
val type = firTypeProjection.toConeTypeProjection().type ?: session.builtinTypes.nullableAnyType.type
if (type is ConeIntersectionType) return@forEachIndexed
// val approximation = TypeApproximationImpl(
// type.classId!!.asFqNameString(),
// type.isMarkedNullable
// )
val approximation = Marker(type)
arguments["typeArg$index"] = Interpreter.Success(approximation)
}

return if (interpretationResults.size == refinedArguments.refinedArguments.size) {
arguments.putAll(interpretationResults)
when (val res = processor.interpret(arguments, this)) {
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,29 @@
import org.jetbrains.kotlinx.dataframe.*
import org.jetbrains.kotlinx.dataframe.annotations.*
import org.jetbrains.kotlinx.dataframe.api.*
import org.jetbrains.kotlinx.dataframe.io.*

/** Row type with a single non-null [String] property `s`, annotated with [DataSchema]. */
@DataSchema
data class D(val s: String)

/**
 * Nested fixture type: an [Int] (`p`), a list of [Int] (`l`) and a list of [D] (`ld`).
 */
class Subtree(val p: Int, val l: List<Int>, val ld: List<D>)

/** Top-level fixture type wrapping a non-null [Subtree] in property `a`. */
class Root(
    val a: Subtree,
)

/**
 * Custom list of nullable [Root] elements that implements [List] by delegating
 * every member to the wrapped list `l`.
 */
class MyList(
    val l: List<Root?>,
) : List<Root?> by l

/**
 * Box-test entry point: wraps a list holding one populated [Root] and one `null`
 * in [MyList], converts it with `toDataFrame(maxDepth = 2)` and calls
 * `compareSchemas(strict = true)` on the result.
 *
 * @return the literal "OK" once all calls have completed.
 */
fun box(): String {
    val populated = Root(Subtree(123, listOf(1), listOf(D("ff"))))
    val rows = listOf(populated, null)
    val frame = MyList(rows).toDataFrame(maxDepth = 2)
    frame.compareSchemas(strict = true)
    return "OK"
}
16 changes: 16 additions & 0 deletions plugins/kotlin-dataframe/testData/box/toDataFrame_nullableList.kt
Original file line number Diff line number Diff line change
@@ -0,0 +1,16 @@
import org.jetbrains.kotlinx.dataframe.*
import org.jetbrains.kotlinx.dataframe.annotations.*
import org.jetbrains.kotlinx.dataframe.api.*
import org.jetbrains.kotlinx.dataframe.io.*

/** [DataSchema]-annotated row type exposing one non-null [String] property, `s`. */
@DataSchema
data class D(val s: String)

/**
 * Box-test entry point: converts a list containing one [D] and one `null` with
 * `toDataFrame()`, then prints both `schema()` and `compileTimeSchema()` of the result.
 *
 * @return the literal "OK" once all calls have completed.
 */
fun box(): String {
    val rows = listOf(D("bb"), null)
    val frame = rows.toDataFrame()
    frame.schema().print()
    frame.compileTimeSchema().print()
    return "OK"
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,27 @@
import org.jetbrains.kotlinx.dataframe.*
import org.jetbrains.kotlinx.dataframe.annotations.*
import org.jetbrains.kotlinx.dataframe.api.*
import org.jetbrains.kotlinx.dataframe.io.*

/** Leaf row type for the fixture tree: one non-null [String] property `s`, marked [DataSchema]. */
@DataSchema
data class D(val s: String)

/**
 * Intermediate fixture node with an [Int] (`p`), a list of [Int] (`l`)
 * and a list of [D] (`ld`).
 */
class Subtree(val p: Int, val l: List<Int>, val ld: List<D>)

/** Fixture root whose property `a` is a non-null [Subtree]. */
class Root(
    val a: Subtree,
)

/**
 * Box-test entry point: converts a list holding one populated [Root] and one `null`
 * element with `toDataFrame(maxDepth = 2)` and calls `compareSchemas(strict = true)`
 * on the result.
 *
 * @return the literal "OK" once all calls have completed.
 */
fun box(): String {
    val populated = Root(Subtree(123, listOf(1), listOf(D("ff"))))
    val rows = listOf(populated, null)
    val frame = rows.toDataFrame(maxDepth = 2)
    frame.compareSchemas(strict = true)
    return "OK"
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,27 @@
import org.jetbrains.kotlinx.dataframe.*
import org.jetbrains.kotlinx.dataframe.annotations.*
import org.jetbrains.kotlinx.dataframe.api.*
import org.jetbrains.kotlinx.dataframe.io.*

/** [DataSchema]-annotated leaf type carrying a single non-null [String], `s`. */
@DataSchema
data class D(val s: String)

/**
 * Fixture node referenced (nullably) from [Root]: an [Int] (`p`),
 * a list of [Int] (`l`) and a list of [D] (`ld`).
 */
class Subtree(val p: Int, val l: List<Int>, val ld: List<D>)

/** Fixture root whose property `a` is a nullable [Subtree]. */
class Root(
    val a: Subtree?,
)

/**
 * Box-test entry point: converts a list of two [Root] values — one with a populated
 * [Subtree], one with `a = null` — using `toDataFrame(maxDepth = 2)` and calls
 * `compareSchemas(strict = true)` on the result.
 *
 * @return the literal "OK" once all calls have completed.
 */
fun box(): String {
    val withSubtree = Root(Subtree(123, listOf(1), listOf(D("ff"))))
    val withoutSubtree = Root(null)
    val frame = listOf(withSubtree, withoutSubtree).toDataFrame(maxDepth = 2)
    frame.compareSchemas(strict = true)
    return "OK"
}
Original file line number Diff line number Diff line change
Expand Up @@ -418,6 +418,12 @@ public void testToDataFrame_column() {
runTest("testData/box/toDataFrame_column.kt");
}

/** Runs the box test backed by {@code testData/box/toDataFrame_customIterable.kt}. */
@Test
@TestMetadata("toDataFrame_customIterable.kt")
public void testToDataFrame_customIterable() {
    final String testDataPath = "testData/box/toDataFrame_customIterable.kt";
    runTest(testDataPath);
}

@Test
@TestMetadata("toDataFrame_dataSchema.kt")
public void testToDataFrame_dataSchema() {
Expand All @@ -436,6 +442,24 @@ public void testToDataFrame_from() {
runTest("testData/box/toDataFrame_from.kt");
}

/** Runs the box test backed by {@code testData/box/toDataFrame_nullableList.kt}. */
@Test
@TestMetadata("toDataFrame_nullableList.kt")
public void testToDataFrame_nullableList() {
    final String testDataPath = "testData/box/toDataFrame_nullableList.kt";
    runTest(testDataPath);
}

/** Runs the box test backed by {@code testData/box/toDataFrame_nullableListSubtree.kt}. */
@Test
@TestMetadata("toDataFrame_nullableListSubtree.kt")
public void testToDataFrame_nullableListSubtree() {
    final String testDataPath = "testData/box/toDataFrame_nullableListSubtree.kt";
    runTest(testDataPath);
}

/** Runs the box test backed by {@code testData/box/toDataFrame_nullableSubtree.kt}. */
@Test
@TestMetadata("toDataFrame_nullableSubtree.kt")
public void testToDataFrame_nullableSubtree() {
    final String testDataPath = "testData/box/toDataFrame_nullableSubtree.kt";
    runTest(testDataPath);
}

@Test
@TestMetadata("toDataFrame_superType.kt")
public void testToDataFrame_superType() {
Expand Down