Skip to content

Commit

Permalink
Merge pull request #531 from gnieh/json/jq/null
Browse files Browse the repository at this point in the history
Add a default fallback value to paths
  • Loading branch information
satabin authored Oct 5, 2023
2 parents 9545f33 + 9cb328f commit 628dd71
Show file tree
Hide file tree
Showing 8 changed files with 117 additions and 36 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -29,7 +29,7 @@ object Query {
case class ForClause[Tag, Path](variable: String, source: Path, result: Query[Tag, Path]) extends Query[Tag, Path]
case class LetClause[Tag, Path](variable: String, query: Query[Tag, Path], result: Query[Tag, Path])
extends Query[Tag, Path]
case class Ordpath[Tag, Path](path: Path) extends Query[Tag, Path]
case class Ordpath[Tag, Path](path: Path, default: Option[Tag]) extends Query[Tag, Path]
case class Variable[Tag, Path](name: String) extends Query[Tag, Path]
case class Node[Tag, Path](tag: Tag, child: Query[Tag, Path]) extends Query[Tag, Path]
case class Leaf[Tag, Path](tag: Tag) extends Query[Tag, Path]
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -18,10 +18,11 @@ package fs2.data
package mft
package query

import pfsa.{Candidate, Pred, Regular}
import cats.Eq
import cats.syntax.all._
import cats.data.NonEmptyList
import cats.syntax.all._

import pfsa.{Candidate, Pred, Regular}

/** This compiler can be used to compile to an MFT any query language that can be represented by nested for loops.
*
Expand Down Expand Up @@ -82,7 +83,10 @@ private[fs2] abstract class QueryCompiler[InTag, OutTag, Path] {
// input is copied in the first argument
q0(any) -> qinit(x0, qcopy(x0))

def translatePath(path: Path, start: builder.StateBuilder, end: builder.StateBuilder): Unit = {
def translatePath(path: Path,
default: Rhs[OutTag],
start: builder.StateBuilder,
end: builder.StateBuilder): Unit = {
val regular = path2regular(path)
val dfa = regular.deriveDFA
// resolve transitions into patterns and guards
Expand Down Expand Up @@ -114,6 +118,7 @@ private[fs2] abstract class QueryCompiler[InTag, OutTag, Path] {
val states2 =
transitions.foldLeft(states1) { case (states, (pattern, guard, tgt)) =>
val finalTgt = dfa.finals.contains(tgt)
val trapTgt = dfa.trap.contains(tgt)
val (q2, states1) =
states.get(tgt) match {
case Some(q2) => (q2, states)
Expand All @@ -122,14 +127,16 @@ private[fs2] abstract class QueryCompiler[InTag, OutTag, Path] {
(q2, states.updated(tgt, q2))
}
val pat: builder.Guardable = tagOf(pattern).fold(anyNode)(aNode(_))
if (!finalTgt) {
q1(pat.when(guard)) -> q2(x1, copyArgs: _*) ~ q1(x2, copyArgs: _*)
if (trapTgt) {
q1(pat.when(guard)) -> (if (default == eps) q2(x1, copyArgs: _*) ~ q1(x2, copyArgs: _*) else default)
} else if (!finalTgt) {
q1(pat.when(guard)) -> q2(x1, copyArgs: _*) ~ (if (default == eps) q1(x2, copyArgs: _*) else eps)
} else if (emitSelected) {
q1(pat.when(guard)) -> end(x1, (copyArgs :+ copy(qcopy(x1))): _*) ~ q2(x1, copyArgs: _*) ~
q1(x2, copyArgs: _*)
(if (default == eps) q1(x2, copyArgs: _*) else eps)
} else {
q1(pat.when(guard)) -> end(x1, (copyArgs :+ qcopy(x1)): _*) ~ q2(x1, copyArgs: _*) ~
q1(x2, copyArgs: _*)
(if (default == eps) q1(x2, copyArgs: _*) else eps)
}
states1
}
Expand All @@ -148,7 +155,7 @@ private[fs2] abstract class QueryCompiler[InTag, OutTag, Path] {
val q1 = state(args = q.nargs + 1)

// compile the variable binding path
translatePath(source, q, q1)
translatePath(source, eps, q, q1)

// then the body with the bound variable
translate(result, variable :: vars, q1)
Expand All @@ -166,11 +173,11 @@ private[fs2] abstract class QueryCompiler[InTag, OutTag, Path] {
val copyArgs = List.tabulate(q.nargs)(y(_))
q(any) -> q1(x0, (copyArgs :+ qv(x0, copyArgs: _*)): _*)

case Query.Ordpath(path) =>
case Query.Ordpath(path, default) =>
val q1 = state(args = q.nargs + 1)

// compile the path
translatePath(path, q, q1)
translatePath(path, default.map(leaf(_)).getOrElse(eps), q, q1)

// emit the result
q1(any) -> y(q.nargs)
Expand Down
6 changes: 4 additions & 2 deletions finite-state/shared/src/main/scala/fs2/data/pfsa/PDFA.scala
Original file line number Diff line number Diff line change
Expand Up @@ -21,8 +21,10 @@ import cats.syntax.foldable._

import Pred.syntax._

private[data] class PDFA[P, T](val init: Int, val finals: Set[Int], val transitions: Array[List[(P, Int)]])(implicit
P: Pred[P, T]) {
private[data] class PDFA[P, T](val init: Int,
val finals: Set[Int],
val trap: Option[Int],
val transitions: Array[List[(P, Int)]])(implicit P: Pred[P, T]) {

def step(q: Int, t: T): Option[Int] =
if (q >= transitions.length)
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -76,6 +76,7 @@ private[data] class PNFA[P, T](val init: Int, val finals: Set[Int], val transiti
case Nil =>
new PDFA[P, T](0,
newFinals.map(newStates(_)),
None,
newTransitions.result().map(_.map { case (p, q) => (p, newStates(q)) }))
case q :: qs =>
if (newStates.contains(q)) {
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -194,8 +194,10 @@ sealed abstract class Regular[CharSet] {
}

val (qs, transitions) = explore(Chain.one(this), Map.empty, this)
val finals = qs.zipWithIndex.collect { case (re, idx) if re.acceptEpsilon => idx }.toList.toSet
new PDFA[CharSet, C](0, finals, Array.tabulate(qs.size.toInt)(transitions.getOrElse(_, Nil)))
val indexedStates = qs.zipWithIndex
val finals = indexedStates.collect { case (re, idx) if re.acceptEpsilon => idx }.toList.toSet
val trap = indexedStates.collectFirst { case (Regular.Chars(cs), idx) if cs === never => idx }
new PDFA[CharSet, C](0, finals, trap, Array.tabulate(qs.size.toInt)(transitions.getOrElse(_, Nil)))
}

}
Expand Down
23 changes: 12 additions & 11 deletions finite-state/shared/src/test/scala/fs2/data/mft/QuerySpec.scala
Original file line number Diff line number Diff line change
Expand Up @@ -116,7 +116,7 @@ abstract class QuerySpec(credit: Int) extends SimpleIOSuite {

test("child path") {
MiniXQueryCompiler
.compile(Query.Ordpath(MiniXPath(NonEmptyList.one(Step.Child(Some("a"))))), credit)
.compile(Query.Ordpath(MiniXPath(NonEmptyList.one(Step.Child(Some("a")))), None), credit)
.esp[IO]
.flatMap { esp =>
Stream
Expand Down Expand Up @@ -163,7 +163,7 @@ abstract class QuerySpec(credit: Int) extends SimpleIOSuite {

test("any child path") {
MiniXQueryCompiler
.compile(Query.Ordpath(MiniXPath(NonEmptyList.one(Step.Child(None)))), credit)
.compile(Query.Ordpath(MiniXPath(NonEmptyList.one(Step.Child(None))), None), credit)
.esp[IO]
.flatMap { esp =>
Stream
Expand Down Expand Up @@ -210,7 +210,7 @@ abstract class QuerySpec(credit: Int) extends SimpleIOSuite {

test("descendant path") {
MiniXQueryCompiler
.compile(Query.Ordpath(MiniXPath(NonEmptyList.one(Step.Descendant(Some("a"))))), credit)
.compile(Query.Ordpath(MiniXPath(NonEmptyList.one(Step.Descendant(Some("a")))), None), credit)
.esp[IO]
.flatMap { esp =>
Stream
Expand Down Expand Up @@ -267,7 +267,7 @@ abstract class QuerySpec(credit: Int) extends SimpleIOSuite {

test("any descendant path") {
MiniXQueryCompiler
.compile(Query.Ordpath(MiniXPath(NonEmptyList.one(Step.Descendant(None)))), credit)
.compile(Query.Ordpath(MiniXPath(NonEmptyList.one(Step.Descendant(None))), None), credit)
.esp[IO]
.flatMap { esp =>
Stream
Expand Down Expand Up @@ -326,10 +326,11 @@ abstract class QuerySpec(credit: Int) extends SimpleIOSuite {

test("simple let") {
MiniXQueryCompiler
.compile(
Query
.LetClause("v", Query.Ordpath(MiniXPath(NonEmptyList.one(Step.Descendant(Some("a"))))), Query.Variable("v")),
credit)
.compile(Query
.LetClause("v",
Query.Ordpath(MiniXPath(NonEmptyList.one(Step.Descendant(Some("a")))), None),
Query.Variable("v")),
credit)
.esp[IO]
.flatMap { esp =>
Stream
Expand Down Expand Up @@ -662,10 +663,10 @@ abstract class QuerySpec(credit: Int) extends SimpleIOSuite {
MiniXPath(NonEmptyList.one(Step.Descendant(Some("b")))),
Query.LetClause(
"v3",
Query.Ordpath(MiniXPath(NonEmptyList.one(Step.Descendant(Some("c"))))),
Query.Ordpath(MiniXPath(NonEmptyList.one(Step.Descendant(Some("c")))), None),
Query.LetClause(
"v4",
Query.Ordpath(MiniXPath(NonEmptyList.one(Step.Descendant(Some("d"))))),
Query.Ordpath(MiniXPath(NonEmptyList.one(Step.Descendant(Some("d")))), None),
Query.Sequence(NonEmptyList
.of(Query.Variable("v1"), Query.Variable("v2"), Query.Variable("v3"), Query.Variable("v4")))
)
Expand Down Expand Up @@ -781,7 +782,7 @@ abstract class QuerySpec(credit: Int) extends SimpleIOSuite {
.compile(
Query.LetClause(
"a",
Query.Ordpath(MiniXPath(NonEmptyList.one(Step.Descendant(Some("a"))))),
Query.Ordpath(MiniXPath(NonEmptyList.one(Step.Descendant(Some("a")))), None),
Query.ForClause(
"b",
MiniXPath(NonEmptyList.one(Step.Descendant(Some("b")))),
Expand Down
22 changes: 12 additions & 10 deletions json/src/main/scala/fs2/data/json/jq/internal/ESPJqCompiler.scala
Original file line number Diff line number Diff line change
Expand Up @@ -34,6 +34,8 @@ private[jq] class ESPJqCompiler[F[_]](implicit F: MonadThrow[F], defer: Defer[F]

override protected val emitSelected: Boolean = false

private val default: Option[TaggedJson] = Some(TaggedJson.Raw(Token.NullValue))

private type State[T] = StateT[F, Int, T]

private val nextIdent: State[String] =
Expand Down Expand Up @@ -223,7 +225,7 @@ private[jq] class ESPJqCompiler[F[_]](implicit F: MonadThrow[F], defer: Defer[F]
}
}

private def preprocess(prefix: Filter, jq: Jq): State[Query[TaggedJson, Filter]] =
private def preprocess(prefix: Filter, jq: Jq, withDefault: Boolean): State[Query[TaggedJson, Filter]] =
jq match {
case Jq.Null =>
pure(Query.Leaf(TaggedJson.Raw(Token.NullValue)))
Expand All @@ -232,7 +234,7 @@ private[jq] class ESPJqCompiler[F[_]](implicit F: MonadThrow[F], defer: Defer[F]
case Jq.Arr(prefix1, values) =>
values.zipWithIndex
.traverse { case (elt, idx) =>
preprocess(prefix ~ prefix1, elt).map(q => Query.Node(TaggedJson.StartArrayElement(idx), q))
preprocess(prefix ~ prefix1, elt, false).map(q => Query.Node(TaggedJson.StartArrayElement(idx), q))
}
.map { elts =>
Query.Node(TaggedJson.Raw(Token.StartArray),
Expand All @@ -256,10 +258,10 @@ private[jq] class ESPJqCompiler[F[_]](implicit F: MonadThrow[F], defer: Defer[F]
case Some(v) =>
Query.node[TaggedJson, Filter](TaggedJson.StartObjectValue(name), Query.variable(v)).pure[State]
case None =>
preprocess(prefix ~ prefix1, elt).map(q => Query.node(TaggedJson.StartObjectValue(name), q))
preprocess(prefix ~ prefix1, elt, true).map(q => Query.node(TaggedJson.StartObjectValue(name), q))
}
else
preprocess(prefix ~ prefix1, elt).map(q => Query.node(TaggedJson.StartObjectValue(name), q))
preprocess(prefix ~ prefix1, elt, true).map(q => Query.node(TaggedJson.StartObjectValue(name), q))
}.map { elts =>
Query.Node(TaggedJson.Raw(Token.StartObject),
NonEmptyList.fromList(elts).fold(Query.empty[TaggedJson, Filter])(Query.Sequence(_)))
Expand All @@ -273,15 +275,15 @@ private[jq] class ESPJqCompiler[F[_]](implicit F: MonadThrow[F], defer: Defer[F]
if (elt == Jq.Identity)
Query.Variable[TaggedJson, Filter](v).pure[State]
else
preprocess(prefix ~ prefix1, elt)
preprocess(prefix ~ prefix1, elt, true)
} yield (v, Query.Node(TaggedJson.StartObjectValue(name), q))
}
v <- nextIdent
inner <-
if (inner == Jq.Identity)
Query.Variable[TaggedJson, Filter](v).pure[State]
else
preprocess(Jq.Identity, inner)
preprocess(Jq.Identity, inner, true)
} yield {
val (before, after) = values.splitAt(idx)
val forClause: Query[TaggedJson, Filter] =
Expand All @@ -306,20 +308,20 @@ private[jq] class ESPJqCompiler[F[_]](implicit F: MonadThrow[F], defer: Defer[F]
case Jq.Iterator(filter, inner: Constructor) =>
for {
v <- nextIdent
inner <- preprocess(Jq.Identity, inner)
inner <- preprocess(Jq.Identity, inner, withDefault)
} yield Query.ForClause(v, prefix ~ filter ~ Jq.Child, inner)
case Jq.Iterator(filter, inner) =>
for {
v <- nextIdent
inner <- preprocess(Jq.Child, inner)
inner <- preprocess(Jq.Child, inner, withDefault)
} yield Query.ForClause(v, prefix ~ filter, inner)
case filter: Filter =>
pure(Query.Ordpath(prefix ~ filter))
pure(Query.Ordpath(prefix ~ filter, if (withDefault) default else None))
}

def compile(jq: Jq): F[Pipe[F, Token, Token]] =
for {
query <- preprocess(Jq.Root, jq).runA(0)
query <- preprocess(Jq.Root, jq, false).runA(0)
mft = compile(query)
esp <- mft.esp
} yield new ESPCompiledJq[F](esp)
Expand Down
66 changes: 66 additions & 0 deletions json/src/test/scala/fs2/data/json/jq/JqSpec.scala
Original file line number Diff line number Diff line change
Expand Up @@ -44,6 +44,34 @@ object JqSpec extends SimpleIOSuite {
} yield expect.same(List(Token.NumberValue("0")), result)
}

test("select not found") {
for {
compiled <- compiler.compile(jq".a[0].d.e")
result <- input.through(compiled).compile.toList
} yield expect.same(Nil, result)
}

test("iterate not found") {
for {
compiled <- compiler.compile(jq""".d[]""")
result <- input.through(compiled).compile.toList
} yield expect.same(Nil, result)
}

test("iterate object not found") {
for {
compiled <- compiler.compile(jq""".d[] | { "value": .a }""")
result <- input.through(compiled).compile.toList
} yield expect.same(Nil, result)
}

test("iterate array not found") {
for {
compiled <- compiler.compile(jq"""[ .d[] ]""")
result <- input.through(compiled).compile.toList
} yield expect.same(List(Token.StartArray, Token.EndArray), result)
}

test("simple recursive descent") {
for {
compiled <- compiler.compile(jq"..")
Expand Down Expand Up @@ -355,4 +383,42 @@ object JqSpec extends SimpleIOSuite {
)
}

test("not found value constructor") {
for {
compiled <- compiler.compile(jq"""{ "value": .a[0].d }""")
result <- input.through(compiled).compile.toList
} yield expect.same(
List(
Token.StartObject,
Token.Key("value"),
Token.NullValue,
Token.EndObject
),
result
)
}

test("not found value object iterator") {
for {
compiled <- compiler.compile(jq"""{ "value": .a[].unknown }""")
result <- input.through(compiled).compile.toList
} yield expect.same(
List(
Token.StartObject,
Token.Key("value"),
Token.NullValue,
Token.EndObject,
Token.StartObject,
Token.Key("value"),
Token.NullValue,
Token.EndObject,
Token.StartObject,
Token.Key("value"),
Token.NullValue,
Token.EndObject
),
result
)
}

}

0 comments on commit 628dd71

Please # to comment.