Note: This is not an official Apache Software Foundation release, see datafusion-contrib/datafusion-functions-json#5.
This crate provides a set of functions for querying JSON strings in DataFusion. The functions are implemented as scalar functions that can be used in SQL queries.
To use these functions, you'll just need to call:
datafusion_functions_json::register_all(&mut ctx)?;
to register the JSON functions below in your `SessionContext`.
-- Create a table with a JSON column stored as a string
CREATE TABLE test_table (id INT, json_col VARCHAR) AS VALUES
(1, '{}'),
(2, '{ "a": 1 }'),
(3, '{ "a": 2 }'),
(4, '{ "a": 1, "b": 2 }'),
(5, '{ "a": 1, "b": 2, "c": 3 }');
-- Check if each document contains the key 'b'
SELECT id, json_contains(json_col, 'b') as json_contains FROM test_table;
-- Results in
-- +----+---------------+
-- | id | json_contains |
-- +----+---------------+
-- | 1 | false |
-- | 2 | false |
-- | 3 | false |
-- | 4 | true |
-- | 5 | true |
-- +----+---------------+
-- Get the value of the key 'a' from each document
SELECT id, json_col->'a' as json_col_a FROM test_table
-- +----+------------+
-- | id | json_col_a |
-- +----+------------+
-- | 1 | {null=} |
-- | 2 | {int=1} |
-- | 3 | {int=2} |
-- | 4 | {int=1} |
-- | 5 | {int=1} |
-- +----+------------+
- `json_contains(json: str, *keys: str | int) -> bool` - true if a JSON string has a specific key (used for the `?` operator)
- `json_get(json: str, *keys: str | int) -> JsonUnion` - Get a value from a JSON string by its "path"
- `json_get_str(json: str, *keys: str | int) -> str` - Get a string value from a JSON string by its "path"
- `json_get_int(json: str, *keys: str | int) -> int` - Get an integer value from a JSON string by its "path"
- `json_get_float(json: str, *keys: str | int) -> float` - Get a float value from a JSON string by its "path"
- `json_get_bool(json: str, *keys: str | int) -> bool` - Get a boolean value from a JSON string by its "path"
- `json_get_json(json: str, *keys: str | int) -> str` - Get a nested raw JSON string from a JSON string by its "path"
- `json_as_text(json: str, *keys: str | int) -> str` - Get any value from a JSON string by its "path", represented as a string (used for the `->>` operator)
- `json_length(json: str, *keys: str | int) -> int` - get the length of a JSON string or array
- `->` operator - alias for `json_get`
- `->>` operator - alias for `json_as_text`
- `?` operator - alias for `json_contains`
Cast expressions with `json_get` are rewritten to the appropriate method, e.g.
select * from foo where json_get(attributes, 'bar')::string='ham'
will be rewritten to:
select * from foo where json_get_str(attributes, 'bar')='ham'
- `json_keys(json: str, *keys: str | int) -> list[str]` - get the keys of a JSON string
- `json_is_obj(json: str, *keys: str | int) -> bool` - true if the JSON is an object
- `json_is_array(json: str, *keys: str | int) -> bool` - true if the JSON is an array
- `json_valid(json: str) -> bool` - true if the JSON is valid