JSONPath: Query expressions for JSON

all authors

$['store']['book'][0]['title']

$.store.book[0].title

$.store.book[?@.price < 10].title

{ "store": {
    "book": [
      { "category": "reference",
        "author": "Nigel Rees",
        "title": "Sayings of the Century",
        "price": 8.95
      },
      { "category": "fiction",
        "author": "Evelyn Waugh",
        "title": "Sword of Honour",
        "price": 12.99
      },
      { "category": "fiction",
        "author": "Herman Melville",
        "title": "Moby Dick",
        "isbn": "0-553-21311-3",
        "price": 8.99
      },
      { "category": "fiction",
        "author": "J. R. R. Tolkien",
        "title": "The Lord of the Rings",
        "isbn": "0-395-19395-8",
        "price": 22.99
      }
    ],
    "bicycle": {
      "color": "red",
      "price": 19.95
    }
  }
}

json-path = root-identifier *(S (child-segment               /
                                 descendant-segment))

root-identifier  = "$"

{"k": "v"}

; A selector is a single entry of a bracketed child segment.
selector =  ( name-selector  /
              wildcard       /   ; "*" selects all children, e.g. `[*]`
              index-selector /
              slice-selector /
              filter-selector
            )

name-selector       = string-literal

string-literal      = %x22 *double-quoted %x22 /       ; "string"
                      %x27 *single-quoted %x27         ; 'string'

double-quoted       = unescaped /
                      %x27      /                       ; '
                      ESC %x22  /                       ; \"
                      ESC escapable

single-quoted       = unescaped /
                      %x22      /                       ; "
                      ESC %x27  /                       ; \'
                      ESC escapable

ESC                 = %x5C                              ; \  backslash

; Characters that may appear literally inside either kind of string literal;
; the quote characters and the backslash are handled by separate alternatives.
unescaped           = %x20-21 /                         ; see RFC 8259
                      %x23-26 /                         ; omit "
                      %x28-5B /                         ; omit '
                      %x5D-10FFFF                       ; omit \

escapable           = ( %x62 / %x66 / %x6E / %x72 / %x74 / ; \b \f \n \r \t
                          ; b /         ;  BS backspace U+0008
                          ; t /         ;  HT horizontal tab U+0009
                          ; n /         ;  LF line feed U+000A
                          ; f /         ;  FF form feed U+000C
                          ; r /         ;  CR carriage return U+000D
                          "/" /          ;  /  slash (solidus) U+002F
                          "\" /          ;  \  backslash (reverse solidus) U+005C
                          (%x75 hexchar) ;  uXXXX      U+XXXX
                      )

hexchar = non-surrogate / (high-surrogate "\" %x75 low-surrogate)
non-surrogate = ((DIGIT / "A"/"B"/"C" / "E"/"F") 3HEXDIG) /
                 ("D" %x30-37 2HEXDIG )
high-surrogate = "D" ("8"/"9"/"A"/"B") 2HEXDIG
low-surrogate = "D" ("C"/"D"/"E"/"F") 2HEXDIG

HEXDIG = DIGIT / "A" / "B" / "C" / "D" / "E" / "F"

; Task from 2021-06-15 interim: update ABNF later

{
  "o": {"j j": {"k.k": 3}},
  "'": {"@": 2}
}

wildcard = "*"

{
  "o": {"j": 1, "k": 2},
  "a": [5, 3]
}

index-selector  = int                             ; decimal integer

int             = ["-"] ( "0" / (DIGIT1 *DIGIT) ) ; -  optional
DIGIT1          = %x31-39                         ; 1-9 non-zero digit

["a","b"]

slice-selector =  [start S] ":" S [end S] [":" [S step ]]

start          = int       ; included in selection
end            = int       ; not included in selection
step           = int       ; default: 1

B              =    %x20 / ; Space
                    %x09 / ; Horizontal tab
                    %x0A / ; Line feed or New line
                    %x0D   ; Carriage return
S              = *B        ; optional blank space
RS             = 1*B       ; required blank space


FUNCTION Normalize(i, len):
  IF i < 0 THEN
    RETURN len + i
  END IF
  RETURN i

FUNCTION Bounds(start, end, step, len):
  n_start = Normalize(start, len)
  n_end = Normalize(end, len)

  IF step < 0 THEN
    upper = MIN(MAX(n_start, -1), len-1)
    lower = MIN(MAX(n_end, -1), len-1)
  ELSE
    lower = MIN(MAX(n_start, 0), len)
    upper = MIN(MAX(n_end, 0), len)
  END IF

  RETURN (lower, upper)

IF step > 0 THEN

  i = lower
  WHILE i < upper:
    SELECT a(i)
    i = i + step
  END WHILE

ELSE IF step < 0 THEN

  i = upper
  WHILE i > lower:
    SELECT a(i)
    i = i + step
  END WHILE

END IF

["a", "b", "c", "d", "e", "f", "g"]

filter-selector = "?" S boolean-expr

boolean-expr     = logical-or-expr
logical-or-expr  = logical-and-expr *(S "||" S logical-and-expr)
                                                      ; disjunction
                                                      ; binds less tightly than conjunction
logical-and-expr = basic-expr *(S "&&" S basic-expr)  ; conjunction
                                                      ; binds more tightly than disjunction

basic-expr        = exist-expr /
                    paren-expr /
                    relation-expr
exist-expr        = [logical-not-op S] singular-path  ; path existence or non-existence

singular-path     = rel-singular-path / abs-singular-path
rel-singular-path = "@" *(S (name-segment / index-segment))
abs-singular-path = root-identifier *(S (name-segment / index-segment))
name-segment      = "[" name-selector "]" / dot-member-name-shorthand
index-segment     = "[" index-selector "]"

paren-expr        = [logical-not-op S] "(" S boolean-expr S ")"
                                                      ; parenthesized expression
logical-not-op    = "!"                               ; logical NOT operator

relation-expr = comp-expr /                           ; comparison test
                regex-expr                            ; regular expression test

comp-expr    = comparable S comp-op S comparable
comparable   = number / string-literal /              ; primitive ...
               true / false / null /                  ; values only
               singular-path                          ; Singular Path value
comp-op      = "==" / "!=" /                          ; comparison operators;
               "<=" / ">=" /                          ; two-character forms come first so an
               "<"  / ">"                             ; ordered-choice parser does not stop at "<" or ">"

number       = int [ frac ] [ exp ]                   ; decimal number
frac         = "." 1*DIGIT                            ; decimal fraction
exp          = "e" [ "-" / "+" ] 1*DIGIT              ; decimal exponent
true         = %x74.72.75.65                          ; true
false        = %x66.61.6c.73.65                       ; false
null         = %x6e.75.6c.6c                          ; null

regex-expr   = (singular-path / string-literal) S regex-op S regex
regex-op     = "=~"                                   ; regular expression match
regex        = string-literal                         ; I-Regexp

{
  "obj": {"x": "y"},
  "arr": [2, 3]
}

{
  "a": [3, 5, 1, 2, 4, 6, {"b": "j"}, {"b": "k"}],
  "o": {"p": 1, "q": 2, "r": 3, "s": 5, "t": {"u": 6}}
}

child-segment             = (child-longhand /
                             dot-wildcard-shorthand /
                             dot-member-name-shorthand)

; One or more selectors, separated by commas, e.g. ['store'] or [0,1].
child-longhand            = "[" S selector *(S "," S selector) S "]"

dot-wildcard-shorthand    = "." wildcard

dot-member-name-shorthand = "." dot-member-name
dot-member-name           = name-first *name-char
name-first                = ALPHA /
                            "_"   /            ; _
                            %x80-10FFFF        ; any non-ASCII Unicode character
name-char                 = DIGIT / name-first

DIGIT                     =  %x30-39              ; 0-9
ALPHA                     =  %x41-5A / %x61-7A    ; A-Z / a-z

descendant-segment               = (descendant-child /
                                    descendant-wildcard-shorthand /
                                    descendant-member-name-shorthand)
; Only the bracketed form may follow ".." here; the "..*" and "..name"
; shorthands have their own rules, and reusing child-segment would also
; admit "...name" and "...*".
descendant-child                 = ".." child-longhand

descendant-wildcard-shorthand    = ".." wildcard
descendant-member-name-shorthand = ".." dot-member-name

{
  "o": {"j": 1, "k": 2},
  "a": [5, 3, [{"j": 4}]]
}

{"a": null, "b": [null], "c": [{}], "null": 1}

normalized-path           = root-identifier *(normal-index-segment)
normal-index-segment      = "[" (normal-name-selector / normal-index-selector) "]"
normal-name-selector      = %x27 *normal-single-quoted %x27 ; 'string'
normal-single-quoted      = normal-unescaped /
                            ESC normal-escapable
normal-unescaped          = %x20-26 /                       ; omit control codes
                            %x28-5B /                       ; omit '
                            %x5D-10FFFF                     ; omit \
normal-escapable          = ( %x62 / %x66 / %x6E / %x72 / %x74 / ; \b \f \n \r \t
                                ; b /         ;  BS backspace U+0008
                                ; t /         ;  HT horizontal tab U+0009
                                ; n /         ;  LF line feed U+000A
                                ; f /         ;  FF form feed U+000C
                                ; r /         ;  CR carriage return U+000D
                                "'" /         ;  ' apostrophe U+0027
                                "\" /         ;  \ backslash (reverse solidus) U+005C
                                (%x75 normal-hexchar) ;  certain values u00xx U+00XX
                            )
normal-hexchar            = "0" "0"
                            (
                              ("0" %x30-37) / ; "00"-"07"
                              ("0" %x62) /    ; "0b"      ; omit U+0008-U+000A
                              ("0" %x65-66) /  ; "0e"-"0f" ; omit U+000C-U+000D
                              ("1" normal-HEXDIG)
                            )
normal-HEXDIG             = DIGIT / %x61-66   ; "0"-"9", "a"-"f"
normal-index-selector     = "0" / (DIGIT1 *DIGIT) ; non-negative decimal integer

/store/book[1]/title

x.store.book[0].title

x['store']['book'][0]['title']

$.store.book[?(@.price < 10)].title

Internet-Draft	JSONPath	October 2022
Gössner, et al.	Expires 20 April 2023	[Page]

JSONPath	Description
`$`	root node identifier (Section 3.4)
`@`	current node identifier (Section 3.5.5) (valid only within filter selectors)
`[<selectors>]`	child segment (Section 3.6.1): selects zero or more children of JSON objects and arrays; contains one or more selectors, separated by commas
`..[<selectors>]`	descendant segment (Section 3.6.2): selects zero or more descendants of JSON objects and arrays; contains one or more selectors, separated by commas
`'name'`	name selector (Section 3.5.1): selects a named child of an object
`*`	wildcard selector (Section 3.5.2): selects all children of an array or object
`3`	index selector (Section 3.5.3): selects an indexed child of an array (from 0)
`0:100:5`	array slice selector (Section 3.5.4): start:end:step for arrays
`?<expr>`	filter selector (Section 3.5.5): selects particular children using a boolean expression
`.name`	shorthand for `['name']`
`.*`	shorthand for `[*]`
`..name`	shorthand for `..['name']`
`..*`	shorthand for `..[*]`

JSONPath	Intended result
`$.store.book[*].author`	the authors of all books in the store
`$..author`	all authors
`$.store.*`	all things in store, which are some books and a red bicycle
`$.store..price`	the prices of everything in the store
`$..book[2]`	the third book
`$..book[-1]`	the last book in order
`$..book[0,1]` `$..book[:2]`	the first two books
`$..book[?(@.isbn)]`	filter all books with ISBN number
`$..book[?(@.price<10)]`	filter all books cheaper than 10
`$..*`	all member values and array elements contained in input value

Query	Result	Result Paths	Comment
`$.o['j j']['k.k']`	`3`	`$['o']['j j']['k.k']`	Named value in nested object
`$.o["j j"]["k.k"]`	`3`	`$['o']['j j']['k.k']`	Named value in nested object
`$["'"]["@"]`	`2`	`$['\'']['@']`	Unusual member names
`$.j`	`{"k": 3}`	`$['j']`	Named value of an object
`$.j.k`	`3`	`$['j']['k']`	Named value in nested object

Query	Result	Result Paths	Comment
`$[*]`	`{"j": 1, "k": 2}` `[5, 3]`	`$['o']` `$['a']`	Object values
`$.o[*]`	`1` `2`	`$['o']['j']` `$['o']['k']`	Object values
`$.o[*]`	`2` `1`	`$['o']['k']` `$['o']['j']`	Alternative result
`$.a[*]`	`5` `3`	`$['a'][0]` `$['a'][1]`	Array members

Escape Sequence	Unicode Character	Description
\b	U+0008	BS backspace
\t	U+0009	HT horizontal tab
\n	U+000A	LF line feed
\f	U+000C	FF form feed
\r	U+000D	CR carriage return
\"	U+0022	quotation mark
\'	U+0027	apostrophe
\/	U+002F	slash (solidus)
\\	U+005C	backslash (reverse solidus)
\uXXXX	U+XXXX	Unicode character

Query	Result	Result Paths	Comment
`$[1]`	`"b"`	`$[1]`	Member of array
`$[-2]`	`"a"`	`$[0]`	Member of array, from the end

Query	Result	Result Paths	Comment
`$[1:3]`	`"b"` `"c"`	`$[1]` `$[2]`	Slice with default step
`$[1:5:2]`	`"b"` `"d"`	`$[1]` `$[3]`	Slice with step 2
`$[5:1:-2]`	`"f"` `"d"`	`$[5]` `$[3]`	Slice with negative step
`$[::-1]`	`"g"` `"f"` `"e"` `"d"` `"c"` `"b"` `"a"`	`$[6]` `$[5]` `$[4]` `$[3]` `$[2]` `$[1]` `$[0]`	Slice in reverse order

Precedence	Operator type	Syntax
5	Grouping	`(...)`
4	Logical NOT	`!`
3	Relations	`==` `!=` `<` `<=` `>` `>=` `=~`
2	Logical AND	`&&`
1	Logical OR	`\|\|`

Comparison	Result	Comment
`$.absent1 == $.absent2`	true	Empty nodelists
`$.absent1 <= $.absent2`	true	`==` implies `<=`
`$.absent == 'g'`	false	Empty nodelist
`$.absent1 != $.absent2`	false	Empty nodelists
`$.absent != 'g'`	true	Empty nodelist
`1 <= 2`	true	Numeric comparison
`1 > 2`	false	Strict, numeric comparison
`13 == '13'`	false	Type mismatch
`'a' <= 'b'`	true	String comparison
`'a' > 'b'`	false	Strict, string comparison
`$.obj == $.arr`	false	Type mismatch
`$.obj != $.arr`	true	Type mismatch
`$.obj == $.obj`	true	Object comparison
`$.obj != $.obj`	false	Object comparison
`$.arr == $.arr`	true	Array comparison
`$.arr != $.arr`	false	Array comparison
`$.obj == 17`	false	Type mismatch
`$.obj != 17`	true	Type mismatch
`$.obj <= $.arr`	false	Objects and arrays are not ordered
`$.obj < $.arr`	false	Objects and arrays are not ordered
`$.obj <= $.obj`	true	`==` implies `<=`
`$.arr <= $.arr`	true	`==` implies `<=`
`1 <= $.arr`	false	Arrays are not ordered
`1 >= $.arr`	false	Arrays are not ordered
`1 > $.arr`	false	Arrays are not ordered
`1 < $.arr`	false	Arrays are not ordered
`true <= true`	true	`==` implies `<=`
`true > true`	false	Booleans are not ordered

Query	Result	Result Paths	Comment
`$.a[?@>3.5]`	`5` `4` `6`	`$['a'][1]` `$['a'][4]` `$['a'][5]`	Array value comparison
`$.a[?@.b]`	`{"b": "j"}` `{"b": "k"}`	`$['a'][6]` `$['a'][7]`	Array value existence
`$.a[?@<2 \|\| @.b == "k"]`	`1` `{"b": "k"}`	`$['a'][2]` `$['a'][7]`	Array value logical OR
`$.a[?@.b =~ "[jk]"]`	`{"b": "j"}` `{"b": "k"}`	`$['a'][6]` `$['a'][7]`	Array value regular expression
`$.o[?@>1 && @<4]`	`2` `3`	`$['o']['q']` `$['o']['r']`	Object value logical AND
`$.o[?@>1 && @<4]`	`3` `2`	`$['o']['r']` `$['o']['q']`	Alternative result
`$.o[?@.u \|\| @.x]`	`{"u": 6}`	`$['o']['t']`	Object value logical OR
`$.a[?(@.b == $.x)]`	`3` `5` `1` `2` `4` `6`	`$['a'][0]` `$['a'][1]` `$['a'][2]` `$['a'][3]` `$['a'][4]` `$['a'][5]`	Comparison of paths with no values
`$[?(@ == @)]`			Comparison of structured values

Query	Result	Result Paths	Comment
`$..j`	`1` `4`	`$['o']['j']` `$['a'][2][0]['j']`	Object values
`$..j`	`4` `1`	`$['a'][2][0]['j']` `$['o']['j']`	Alternative result
`$..[0]`	`5` `{"j": 4}`	`$['a'][0]` `$['a'][2][0]`	Array values
`$..[0]`	`{"j": 4}` `5`	`$['a'][2][0]` `$['a'][0]`	Alternative result
`$..[*]` `$..*`	`{"j": 1, "k" : 2}` `[5, 3, [{"j": 4}]]` `1` `2` `5` `3` `[{"j": 4}]` `{"j": 4}` `4`	`$['o']` `$['a']` `$['o']['j']` `$['o']['k']` `$['a'][0]` `$['a'][1]` `$['a'][2]` `$['a'][2][0]` `$['a'][2][0]['j']`	All values

Query	Result	Result Paths	Comment
`$.a`	`null`	`$['a']`	Object value
`$.a[0]`			`null` used as array
`$.a.d`			`null` used as object
`$.b[0]`	`null`	`$['b'][0]`	Array value
`$.b[*]`	`null`	`$['b'][0]`	Array value
`$.b[?@]`	`null`	`$['b'][0]`	Existence
`$.b[?@==null]`	`null`	`$['b'][0]`	Comparison
`$.c[?(@.d==null)]`			Comparison with "missing" value
`$.null`	`1`	`$['null']`	Not JSON null at all, just a string as object key

XPath	JSONPath	Description
`/`	`$`	the root XML element
`.`	`@`	the current XML element
`/`	`.` or `[]`	child operator
`..`	n/a	parent operator
`//`	`..name`, `..[index]`, `..*`, or `..[*]`	descendants (JSONPath borrows this syntax from E4X)
`*`	`*`	wildcard: All XML elements regardless of their names
`@`	n/a	attribute access: JSON values do not have attributes
`[]`	`[]`	subscript operator used to iterate over XML element collections and for predicates
`\|`	`[,]`	Union operator (results in a combination of node sets); called list operator in JSONPath, allows combining member names, array indices, and slices
n/a	`[start:end:step]`	array slice operator borrowed from ES4
`[]`	`?()`	applies a filter (script) expression
seamless	n/a	expression engine
`()`	n/a	grouping

XPath	JSONPath	Result
`/store/book/author`	`$.store.book[*].author`	the authors of all books in the store
`//author`	`$..author`	all authors
`/store/*`	`$.store.*`	all things in store, which are some books and a red bicycle
`/store//price`	`$.store..price`	the prices of everything in the store
`//book[3]`	`$..book[2]`	the third book
`//book[last()]`	`$..book[-1]`	the last book in order
`//book[position()<3]`	`$..book[0,1]` `$..book[:2]`	the first two books
`//book[isbn]`	`$..book[?(@.isbn)]`	filter all books with isbn number
`//book[price<10]`	`$..book[?(@.price<10)]`	filter all books cheaper than 10
`//*`	`$..*`	all elements in XML document; all member values and array elements contained in input value