diff --git a/.circleci/db-migration.sh b/.circleci/db-migration.sh
index 7bcc68659d..e91b3fbe75 100755
--- a/.circleci/db-migration.sh
+++ b/.circleci/db-migration.sh
@@ -13,7 +13,7 @@
# Version of PostgreSQL
readonly POSTGRES_VERSION="14"
# Version of Marquez
-readonly MARQUEZ_VERSION=0.49.0
+readonly MARQUEZ_VERSION=0.50.0
# Build version of Marquez
readonly MARQUEZ_BUILD_VERSION="$(git log --pretty=format:'%h' -n 1)" # SHA1
readonly POSTGRES_PORT=5432
diff --git a/.env.example b/.env.example
index 6cb62675e4..0b1cc7b81c 100644
--- a/.env.example
+++ b/.env.example
@@ -3,4 +3,4 @@ API_ADMIN_PORT=5001
WEB_PORT=3000
POSTGRES_PORT=5432
SEARCH_PORT=9200
-TAG=0.49.0
+TAG=0.50.0
diff --git a/chart/Chart.yaml b/chart/Chart.yaml
index 36cd9ba259..6d4c87ec0e 100644
--- a/chart/Chart.yaml
+++ b/chart/Chart.yaml
@@ -29,4 +29,4 @@ name: marquez
sources:
- https://github.com/MarquezProject/marquez
- https://marquezproject.github.io/marquez/
-version: 0.49.0
+version: 0.50.0
diff --git a/chart/values.yaml b/chart/values.yaml
index 6f91df8ff6..e70dbffd40 100644
--- a/chart/values.yaml
+++ b/chart/values.yaml
@@ -20,7 +20,7 @@ marquez:
image:
registry: docker.io
repository: marquezproject/marquez
- tag: 0.49.0
+ tag: 0.50.0
pullPolicy: IfNotPresent
## Name of the existing secret containing credentials for the Marquez installation.
## When this is specified, it will take precedence over the values configured in the 'db' section.
@@ -80,7 +80,7 @@ web:
image:
registry: docker.io
repository: marquezproject/marquez-web
- tag: 0.49.0
+ tag: 0.50.0
pullPolicy: IfNotPresent
## Marquez website will run on this port
##
diff --git a/clients/java/README.md b/clients/java/README.md
index 2dad915123..58132fe73c 100644
--- a/clients/java/README.md
+++ b/clients/java/README.md
@@ -10,14 +10,14 @@ Maven:
io.github.marquezproject
marquez-java
- 0.49.0
+ 0.50.0
```
or Gradle:
```groovy
-implementation 'io.github.marquezproject:marquez-java:0.49.0
+implementation 'io.github.marquezproject:marquez-java:0.50.0'
```
## Usage
diff --git a/docker/up.sh b/docker/up.sh
index e660408134..56878e19da 100755
--- a/docker/up.sh
+++ b/docker/up.sh
@@ -8,9 +8,9 @@
set -e
# Version of Marquez
-readonly VERSION=0.49.0
+readonly VERSION=0.50.0
# Build version of Marquez
-readonly BUILD_VERSION=0.49.0
+readonly BUILD_VERSION=0.50.0
title() {
echo -e "\033[1m${1}\033[0m"
diff --git a/docs/openapi.html b/docs/openapi.html
index 9a4b99add6..475b50216c 100644
--- a/docs/openapi.html
+++ b/docs/openapi.html
@@ -12,2196 +12,377 @@
margin: 0;
}
-
- Marquez (0.49.0) Download OpenAPI specification:Download
Marquez is an open source metadata service for the collection , aggregation , and visualization of a data ecosystem's metadata.
-
Create a namespace Creates a new namespace object. A namespace enables the contextual grouping of related jobs and datasets. Namespaces must contain only letters (a-z
, A-Z
), numbers (0-9
), underscores (_
), dashes (-
), colons (:
), slashes (/
), or dots (.
). A namespace is case-insensitive with a maximum length of 1024
characters. Note jobs and datasets will be unique within a namespace, but not across namespaces.
-
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
Request Body schema: application/json
ownerName required
string
The owner of the namespace.
-
description string
The description of the namespace.
-
put /namespaces/{namespace} http://localhost:5000/api/v1 /namespaces/{namespace}
Request samples Content type application/json
Response samples Content type application/json
{ "name" : "my-namespace" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"ownerName" : "me" ,
"description" : "My first namespace!"
}
Retrieve a namespace path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
get /namespaces/{namespace} http://localhost:5000/api/v1 /namespaces/{namespace}
Response samples Content type application/json
{ "name" : "my-namespace" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"ownerName" : "me" ,
"description" : "My first namespace!"
}
Deletes a namespace Soft deletes a namespace, and every job and dataset inside. On next event containing this namespace, the namespace will be undeleted.
-
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
delete /namespaces/{namespace} http://localhost:5000/api/v1 /namespaces/{namespace}
Response samples Content type application/json
{ "name" : "my-namespace" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"ownerName" : "me" ,
"description" : "My first namespace!"
}
List all namespaces Returns a list of namespaces.
-
query Parameters limit integer
Default: 100
Example: limit=25
The number of results to return from offset.
-
offset integer
Default: 0
The initial position from which to return results.
-
get /namespaces http://localhost:5000/api/v1 /namespaces
Response samples Content type application/json
Copy
Expand all Collapse all { "namespaces" :
[ { "name" : "my-namespace" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"ownerName" : "me" ,
"description" : "My first namespace!"
} ] }
List all received OpenLineage events. Returns a list of OpenLineage events, sorted in direction of passed sort parameter. By default it is desc.
-
query Parameters sortDirection string
Example: sortDirection=name
Sorts the results of your query by indicated direction asc
or desc
.
-
before string <date-time>
Example: before=2022-09-15T07:47:19Z
Returns events before passed date.
-
after string <date-time>
Example: after=2022-09-15T07:47:19Z
Returns events after passed date.
-
limit integer
Default: 100
Example: limit=25
The number of results to return from offset.
-
offset integer
Default: 0
The initial position from which to return results.
-
get /events/lineage http://localhost:5000/api/v1 /events/lineage
Response samples Content type application/json
Copy
Expand all Collapse all Create a source Deprecated Creates a new source object. A source is the physical location of a dataset such as a table in PostgreSQL, or topic in Kafka. A source enables the grouping of physical datasets to their physical source.
-
path Parameters source required
string <= 1024 characters
Example: my-source
The name of the source.
-
Request Body schema: application/json
type required
string
The type of the source.
-
connectionUrl required
string <URL>
The URL to the location of the source.
-
description string
The description of the source.
-
put /sources/{source} http://localhost:5000/api/v1 /sources/{source}
Request samples Content type application/json
Response samples Content type application/json
{ "type" : "POSTGRESQL" ,
"name" : "my-source" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"connectionUrl" : "jdbc:postgresql://db.example.com/mydb" ,
"description" : "My first source!"
}
Retrieve a source path Parameters source required
string <= 1024 characters
Example: my-source
The name of the source.
-
get /sources/{source} http://localhost:5000/api/v1 /sources/{source}
Response samples Content type application/json
{ "type" : "POSTGRESQL" ,
"name" : "my-source" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"connectionUrl" : "jdbc:postgresql://db.example.com/mydb" ,
"description" : "My first source!"
}
List all sources Returns a list of sources.
-
query Parameters limit integer
Default: 100
Example: limit=25
The number of results to return from offset.
-
offset integer
Default: 0
The initial position from which to return results.
-
get /sources http://localhost:5000/api/v1 /sources
Response samples Content type application/json
Copy
Expand all Collapse all { "sources" :
[ { "type" : "POSTGRESQL" ,
"name" : "my-source" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"connectionUrl" : "jdbc:postgresql://db.example.com/mydb" ,
"description" : "My first source!"
} ] }
Create a dataset Deprecated path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
dataset required
string <= 1024 characters
Example: my-dataset
The name of the dataset.
-
Request Body schema: application/json
Any of DbTable Stream
type required
string
Value: "DB_TABLE"
The type of the dataset.
-
physicalName required
string
The physical name of the table.
-
sourceName required
string
The name of the source associated with the table.
-
fields required
Array of objects
The fields of the table.
-
tags description string
The description of the table.
-
runId string
The ID associated with the run modifying the table.
-
put /namespaces/{namespace}/datasets/{dataset} http://localhost:5000/api/v1 /namespaces/{namespace}/datasets/{dataset}
Request samples Content type application/json
Copy
Expand all Collapse all { "type" : "DB_TABLE" ,
"physicalName" : "public.mytable" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name" : "a" ,
"type" : "INTEGER"
} ,
{ "name" : "b" ,
"type" : "TIMESTAMP"
} ,
{ "name" : "c" ,
"type" : "INTEGER"
} ,
{ "name" : "d" ,
"type" : "INTEGER"
} ] , "description" : "My first dataset!"
}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name'" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name'" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name'" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name'" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"lastModifiedAt" : null ,
"description" : "My first dataset!" ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
}
Retrieve a dataset path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
dataset required
string <= 1024 characters
Example: my-dataset
The name of the dataset.
-
get /namespaces/{namespace}/datasets/{dataset} http://localhost:5000/api/v1 /namespaces/{namespace}/datasets/{dataset}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name'" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name'" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name'" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name'" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"lastModifiedAt" : null ,
"description" : "My first dataset!" ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
}
Soft deletes dataset. Soft deletes dataset. It will be un-deleted if new OpenLineage event containing this dataset comes.
-
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
dataset required
string <= 1024 characters
Example: my-dataset
The name of the dataset.
-
delete /namespaces/{namespace}/datasets/{dataset} http://localhost:5000/api/v1 /namespaces/{namespace}/datasets/{dataset}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name'" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name'" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name'" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name'" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"lastModifiedAt" : null ,
"description" : "My first dataset!" ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
}
Retrieve a version for a dataset Returns a version for a dataset.
-
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
dataset required
string <= 1024 characters
Example: my-dataset
The name of the dataset.
-
version required
string <uuid>
Example: ea9badc5-7cb2-49af-9a9f-155771d3a797
The ID of the job or dataset version.
-
get /namespaces/{namespace}/datasets/{dataset}/versions/{version} http://localhost:5000/api/v1 /namespaces/{namespace}/datasets/{dataset}/versions/{version}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"version" : "d224dac0-35d7-4d9b-bbbe-6fff1a8485ad" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"description" : "My first dataset!" ,
"createdByRun" :
{ "id" : "0e89b60a-d80d-42ae-a12b-bd79ae1fb576" ,
"createdAt" : "2019-05-09T18:52:35.620763Z" ,
"updatedAt" : "2019-05-09T18:53:41.461122Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "COMPLETED" ,
"startedAt" : "2021-02-05T18:53:33.245492Z" ,
"endedAt" : "2021-02-05T18:53:41.461122Z" ,
"durationMs" : 8216 ,
"jobVersion" :
{ "namespace" : "my-namespace" ,
"name" : "my_processing_job" ,
"version" : "0ba5b13b-350e-40f3-ba3f-cc00a4e92d11"
} , "inputVersions" :
[ { "namespace" : "my-namespace" ,
"name" : "an_input_dataset" ,
"version" : "d224dac0-35d7-4d9b-bbbe-6fff1a8485ad"
} ] , } }
List all versions for a dataset Returns a list of versions for a dataset.
-
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
dataset required
string <= 1024 characters
Example: my-dataset
The name of the dataset.
-
query Parameters limit integer
Default: 100
Example: limit=25
The number of results to return from offset.
-
offset integer
Default: 0
The initial position from which to return results.
-
get /namespaces/{namespace}/datasets/{dataset}/versions http://localhost:5000/api/v1 /namespaces/{namespace}/datasets/{dataset}/versions
Response samples Content type application/json
Copy
Expand all Collapse all { "versions" :
[ { "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"version" : "d224dac0-35d7-4d9b-bbbe-6fff1a8485ad" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"description" : "My first dataset!" ,
"createdByRun" :
{ "id" : "0e89b60a-d80d-42ae-a12b-bd79ae1fb576" ,
"createdAt" : "2019-05-09T18:52:35.620763Z" ,
"updatedAt" : "2019-05-09T18:53:41.461122Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "COMPLETED" ,
"startedAt" : "2021-02-05T18:53:33.245492Z" ,
"endedAt" : "2021-02-05T18:53:41.461122Z" ,
"durationMs" : 8216 ,
"jobVersion" :
{ "namespace" : "my-namespace" ,
"name" : "my_processing_job" ,
"version" : "0ba5b13b-350e-40f3-ba3f-cc00a4e92d11"
} , "inputVersions" :
[ { "namespace" : "my-namespace" ,
"name" : "an_input_dataset" ,
"version" : "d224dac0-35d7-4d9b-bbbe-6fff1a8485ad"
} ] , } } ] }
List all datasets Returns a list of datasets.
-
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
dataset required
string <= 1024 characters
Example: my-dataset
The name of the dataset.
-
query Parameters limit integer
Default: 100
Example: limit=25
The number of results to return from offset.
-
offset integer
Default: 0
The initial position from which to return results.
-
get /namespaces/{namespace}/datasets http://localhost:5000/api/v1 /namespaces/{namespace}/datasets
Response samples Content type application/json
Copy
Expand all Collapse all { "datasets" :
[ { "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name'" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name'" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name'" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name'" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"lastModifiedAt" : null ,
"description" : "My first dataset!" ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
} ] , "totalCount" : 0
}
Tag a dataset Tag an existing dataset.
-
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
dataset required
string <= 1024 characters
Example: my-dataset
The name of the dataset.
-
tag required
string
Example: SENSITIVE
post /namespaces/{namespace}/datasets/{dataset}/tags/{tag} http://localhost:5000/api/v1 /namespaces/{namespace}/datasets/{dataset}/tags/{tag}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name'" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name'" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name'" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name'" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"lastModifiedAt" : null ,
"description" : "My first dataset!" ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
}
Tag a field Tag an existing field of a dataset.
-
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
dataset required
string <= 1024 characters
Example: my-dataset
The name of the dataset.
-
field required
tag required
string
Example: SENSITIVE
post /namespaces/{namespace}/datasets/{dataset}/fields/{field}/tags/{tag} http://localhost:5000/api/v1 /namespaces/{namespace}/datasets/{dataset}/fields/{field}/tags/{tag}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name'" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name'" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name'" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name'" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"lastModifiedAt" : null ,
"description" : "My first dataset!" ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
}
Create a job Deprecated Creates a new job object. All job objects are immutable and are uniquely identified by a generated ID. Marquez will create a version of a job each time the contents of the object is modified. For example, the location
of a job may change over time resulting in new versions. The accumulated versions can be listed, used to rerun a specific job version or possibly help debug a failed job run.
-
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
job required
string <= 1024 characters
Example: my-job
Request Body schema: application/json
id type required
string (JobType)
Enum: "BATCH" "STREAM" "SERVICE"
inputs required
Array of objects (DatasetId) unique
The set of input datasets.
-
outputs required
Array of objects (DatasetId) unique
The set of output datasets.
-
location string <URL>
The URL of the job source code or artifact.
-
context object
Deprecated
A key/value pair that must be of type string
. A context can be used for getting additional details about the job.
-
description string
The description of the job.
-
runId string
An optional run ID used to associate a job version to an existing job run.
-
put /namespaces/{namespace}/jobs/{job} http://localhost:5000/api/v1 /namespaces/{namespace}/jobs/{job}
Request samples Content type application/json
Copy
Expand all Collapse all Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "BATCH" ,
"name" : "my-job" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"outputs" : [ ] ,
"description" : "My first job!" ,
"latestRun" : null ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
}
Retrieve a job path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
job required
string <= 1024 characters
Example: my-job
get /namespaces/{namespace}/jobs/{job} http://localhost:5000/api/v1 /namespaces/{namespace}/jobs/{job}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "BATCH" ,
"name" : "my-job" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"outputs" : [ ] ,
"description" : "My first job!" ,
"latestRun" : null ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
}
Soft deletes job. Soft deletes job. It will be un-deleted if new OpenLineage event containing this job comes.
-
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
job required
string <= 1024 characters
Example: my-job
delete /namespaces/{namespace}/jobs/{job} http://localhost:5000/api/v1 /namespaces/{namespace}/jobs/{job}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "BATCH" ,
"name" : "my-job" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"outputs" : [ ] ,
"description" : "My first job!" ,
"latestRun" : null ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
}
List all jobs Returns a list of jobs.
-
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
query Parameters limit integer
Default: 100
Example: limit=25
The number of results to return from offset.
-
offset integer
Default: 0
The initial position from which to return results.
-
get /namespaces/{namespace}/jobs http://localhost:5000/api/v1 /namespaces/{namespace}/jobs
Response samples Content type application/json
Copy
Expand all Collapse all { "jobs" :
[ { "type" : "BATCH" ,
"name" : "my-job" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"outputs" : [ ] ,
"description" : "My first job!" ,
"latestRun" : null ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
} ] , "totalCount" : 0
}
Retrieve a version for a job Returns a version for a job.
-
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
job required
string <= 1024 characters
Example: my-job
version required
string <uuid>
Example: ea9badc5-7cb2-49af-9a9f-155771d3a797
The ID of the job or dataset version.
-
get /namespaces/{namespace}/jobs/{job}/versions/{version} http://localhost:5000/api/v1 /namespaces/{namespace}/jobs/{job}/versions/{version}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "BATCH" ,
"name" : "my-job" ,
"version" : "56472c57-a2ef-4218-b7b7-d2af02a343fd" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"outputs" : [ ] ,
"description" : "My first job!" ,
"facets" : { }
}
List all versions for a job Returns a list of versions for a job.
-
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
job required
string <= 1024 characters
Example: my-job
get /namespaces/{namespace}/jobs/{job}/versions http://localhost:5000/api/v1 /namespaces/{namespace}/jobs/{job}/versions
Response samples Content type application/json
Copy
Expand all Collapse all { "versions" :
[ { "type" : "BATCH" ,
"name" : "my-job" ,
"version" : "56472c57-a2ef-4218-b7b7-d2af02a343fd" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"outputs" : [ ] ,
"description" : "My first job!" ,
"facets" : { }
} ] }
Create a run Deprecated Creates a new run object for a job.
-
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
job required
string <= 1024 characters
Example: my-job
Request Body schema: application/json
id string <uuid>
An optional user-provided unique ID of the run. A run ID must be an UUID . If an ID for the run is not provided, a random UUID will be generated for the given run.
-
nominalStartTime string <date-time>
An ISO-8601 timestamp representing the nominal start time of the run.
-
nominalEndTime string <date-time>
An ISO-8601 timestamp representing the nominal end time of the run.
-
args object
The arguments of the run.
-
post /namespaces/{namespace}/jobs/{job}/runs http://localhost:5000/api/v1 /namespaces/{namespace}/jobs/{job}/runs
Request samples Content type application/json
Copy
Expand all Collapse all Response samples Content type application/json
Example IncompleteRun IncompleteRun Copy
Expand all Collapse all { "id" : "870492da-ecfb-4be0-91b9-9a89ddd3db90" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "RUNNING" ,
"startedAt" : "2019-05-09T15:17:32.690346" ,
"endedAt" : null ,
"durationMs" : null ,
"args" :
{ "email" : "me@example.com" ,
"emailOnFailure" : "false" ,
"emailOnRetry" : "true" ,
"retries" : "1"
} , "facets" : { }
}
List all runs Returns a list of runs for a job.
-
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
-
job required
string <= 1024 characters
Example: my-job
query Parameters limit integer
Default: 100
Example: limit=25
The number of results to return from offset.
-
offset integer
Default: 0
The initial position from which to return results.
-
get /namespaces/{namespace}/jobs/{job}/runs http://localhost:5000/api/v1 /namespaces/{namespace}/jobs/{job}/runs
Response samples Content type application/json
Copy
Expand all Collapse all { "runs" :
[ { "id" : "870492da-ecfb-4be0-91b9-9a89ddd3db90" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "COMPLETED" ,
"startedAt" : "2019-05-09T15:17:32.690346" ,
"endedAt" : "2019-05-09T20:05:46.815920Z" ,
"durationMs" : 4250894125 ,
"args" :
{ "email" : "me@example.com" ,
"emailOnFailure" : "false" ,
"emailOnRetry" : "true" ,
"retries" : "1"
} , "facets" : { }
} ] }
Retrieve a run path Parameters id required
string <uuid>
Example: ea9badc5-7cb2-49af-9a9f-155771d3a797
get /jobs/runs/{id} http://localhost:5000/api/v1 /jobs/runs/{id}
Response samples Content type application/json
Example IncompleteRun IncompleteRun Copy
Expand all Collapse all { "id" : "870492da-ecfb-4be0-91b9-9a89ddd3db90" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "RUNNING" ,
"startedAt" : "2019-05-09T15:17:32.690346" ,
"endedAt" : null ,
"durationMs" : null ,
"args" :
{ "email" : "me@example.com" ,
"emailOnFailure" : "false" ,
"emailOnRetry" : "true" ,
"retries" : "1"
} , "facets" : { }
}
Retrieve run or job facets for a run. Retrieve run or job facets for a run.
-
path Parameters id required
string <uuid>
Example: ea9badc5-7cb2-49af-9a9f-155771d3a797
query Parameters type required
string
Enum: "run" "job"
Indicates if should return job or run facets.
-
get /jobs/runs/{id}/facets http://localhost:5000/api/v1 /jobs/runs/{id}/facets
Response samples Content type application/json
Copy
Expand all Collapse all Start a run Deprecated Marks the run as RUNNING
.
-
path Parameters id required
string <uuid>
Example: ea9badc5-7cb2-49af-9a9f-155771d3a797
query Parameters at string <date-time>
An ISO-8601 timestamp representing the time when the run transitioned.
-
post /jobs/runs/{id}/start http://localhost:5000/api/v1 /jobs/runs/{id}/start
Response samples Content type application/json
Copy
Expand all Collapse all { "id" : "870492da-ecfb-4be0-91b9-9a89ddd3db90" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "RUNNING" ,
"startedAt" : "2019-05-09T15:17:32.690346" ,
"endedAt" : null ,
"durationMs" : null ,
"args" :
{ "email" : "me@example.com" ,
"emailOnFailure" : "false" ,
"emailOnRetry" : "true" ,
"retries" : "1"
} , "facets" : { }
}
Complete a run Deprecated Marks the run as COMPLETED
.
-
path Parameters id required
string <uuid>
Example: ea9badc5-7cb2-49af-9a9f-155771d3a797
query Parameters at string <date-time>
An ISO-8601 timestamp representing the time when the run transitioned.
-
post /jobs/runs/{id}/complete http://localhost:5000/api/v1 /jobs/runs/{id}/complete
Response samples Content type application/json
Example IncompleteRun IncompleteRun Copy
Expand all Collapse all { "id" : "870492da-ecfb-4be0-91b9-9a89ddd3db90" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "RUNNING" ,
"startedAt" : "2019-05-09T15:17:32.690346" ,
"endedAt" : null ,
"durationMs" : null ,
"args" :
{ "email" : "me@example.com" ,
"emailOnFailure" : "false" ,
"emailOnRetry" : "true" ,
"retries" : "1"
} , "facets" : { }
}
Fail a run Deprecated Marks the run as FAILED
.
-
path Parameters id required
string <uuid>
Example: ea9badc5-7cb2-49af-9a9f-155771d3a797
query Parameters at string <date-time>
An ISO-8601 timestamp representing the time when the run transitioned.
-
post /jobs/runs/{id}/fail http://localhost:5000/api/v1 /jobs/runs/{id}/fail
Response samples Content type application/json
Copy
Expand all Collapse all { "id" : "870492da-ecfb-4be0-91b9-9a89ddd3db90" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "RUNNING" ,
"startedAt" : "2019-05-09T15:17:32.690346" ,
"endedAt" : null ,
"durationMs" : null ,
"args" :
{ "email" : "me@example.com" ,
"emailOnFailure" : "false" ,
"emailOnRetry" : "true" ,
"retries" : "1"
} , "facets" : { }
}
Abort a run Deprecated Marks the run as ABORTED
.
-
path Parameters id required
string <uuid>
Example: ea9badc5-7cb2-49af-9a9f-155771d3a797
query Parameters at string <date-time>
An ISO-8601 timestamp representing the time when the run transitioned.
-
post /jobs/runs/{id}/abort http://localhost:5000/api/v1 /jobs/runs/{id}/abort
Response samples Content type application/json
Copy
Expand all Collapse all { "id" : "870492da-ecfb-4be0-91b9-9a89ddd3db90" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "RUNNING" ,
"startedAt" : "2019-05-09T15:17:32.690346" ,
"endedAt" : null ,
"durationMs" : null ,
"args" :
{ "email" : "me@example.com" ,
"emailOnFailure" : "false" ,
"emailOnRetry" : "true" ,
"retries" : "1"
} , "facets" : { }
}
Record a single lineage event Receive, process, and store lineage metadata using the OpenLineage standard.
-
Request Body schema: application/json
post /lineage http://localhost:5000/api/v1 /lineage
Request samples Content type application/json
Copy
Expand all Collapse all Get a lineage graph query Parameters nodeId required
string
Example: nodeId=dataset:food_delivery:public.delivery_7_days
The ID of the node. A node can either be a dataset node, a dataset field node or a job node. The format of nodeId for dataset is dataset:<namespace_of_dataset>:<name_of_the_dataset>
, for dataset field is datasetField:<namespace_of_dataset>:<name_of_the_dataset>:<name_of_field>
, and for job is job:<namespace_of_the_job>:<name_of_the_job>
.
-
depth integer
Default: 20
Depth of lineage graph to create.
-
get /lineage http://localhost:5000/api/v1 /lineage
Response samples Content type application/json
Copy
Expand all Collapse all { "graph" :
[ { "id" : "string" ,
"type" : "JOB" ,
"data" :
{ "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"lastModifiedAt" : null ,
"description" : "My first dataset!" ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
} , "inEdges" :
[ { "origin" : "string" ,
"destination" : "string"
} ] , "outEdges" :
[ { "origin" : "string" ,
"destination" : "string"
} ] } ] }
Get the upstream lineage for a given run get /runlineage/upstream http://localhost:5000/api/v1 /runlineage/upstream
Response samples Content type application/json
Copy
Expand all Collapse all Get a column lineage graph query Parameters nodeId required
string
Example: nodeId=dataset:food_delivery:public.delivery_7_days
The ID of the node. A node can either be a dataset node, a dataset field node or a job node. The format of nodeId for dataset is dataset:<namespace_of_dataset>:<name_of_the_dataset>
, for dataset field is datasetField:<namespace_of_dataset>:<name_of_the_dataset>:<name_of_field>
, and for job is job:<namespace_of_the_job>:<name_of_the_job>
.
-
depth integer
Default: 20
Depth of lineage graph to create.
-
withDownstream boolean
Default: false
Determines if downstream lineage should be returned.
-
get /column-lineage http://localhost:5000/api/v1 /column-lineage
Response samples Content type application/json
Copy
Expand all Collapse all { "graph" :
[ { "id" : "string" ,
"type" : "JOB" ,
"data" :
{ "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"lastModifiedAt" : null ,
"description" : "My first dataset!" ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
} , "inEdges" :
[ { "origin" : "string" ,
"destination" : "string"
} ] , "outEdges" :
[ { "origin" : "string" ,
"destination" : "string"
} ] } ] }
Query all datasets and jobs Returns one or more datasets and jobs of your query.
-
query Parameters q required
string
Example: q=my-dataset
Query containing pattern to match; datasets and jobs pattern matching is string based and case-insensitive. Use percent sign (%
) to match any string of zero or more characters (my-job%
), or an underscore (_
) to match a single character (_job_
).
-
filter string
Example: filter=dataset
Filters the results of your query by dataset
or job
.
-
sort string
Example: sort=name
Sorts the results of your query by name
or updated_at
.
-
limit integer
Default: 100
Example: limit=25
The number of results to return from offset.
-
namespace string <= 1024 characters
Example: namespace=my-namespace
Match jobs or datasets within the given namespace.
-
before string YYYY-MM-DD
Example: before=2022-09-15
Match jobs or datasets before YYYY-MM-DD
.
-
after string YYYY-MM-DD
Example: after=2022-09-15
Match jobs or datasets after YYYY-MM-DD
.
-
get /search http://localhost:5000/api/v1 /search
Response samples Content type application/json
Copy
Expand all Collapse all { "totalCount" : 1 ,
"results" :
[ { "type" : "DATASET" ,
"name" : "public.delivery_7_days" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "food_delivery" ,
"nodeId" : "dataset:food_delivery:public.delivery_7_days"
} ] }
-
+ " fill="currentColor">
Marquez (0.50.0) Download OpenAPI specification:Download
Marquez is an open source metadata service for the collection, aggregation, and visualization of a data ecosystem's metadata.
+
Create a namespace Creates a new namespace object. A namespace enables the contextual grouping of related jobs and datasets. Namespaces must contain only letters (a-z
, A-Z
), numbers (0-9
), underscores (_
), dashes (-
), colons (:
), slashes (/
), or dots (.
). A namespace is case-insensitive with a maximum length of 1024
characters. Note jobs and datasets will be unique within a namespace, but not across namespaces.
+
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
Request Body schema: application/json
ownerName required
string
The owner of the namespace.
+
description string
The description of the namespace.
+
put /namespaces/{namespace} http://localhost:5000/api/v1 /namespaces/{namespace}
Request samples Content type application/json
Response samples Content type application/json
{ "name" : "my-namespace" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"ownerName" : "me" ,
"description" : "My first namespace!"
}
Retrieve a namespace path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
get /namespaces/{namespace} http://localhost:5000/api/v1 /namespaces/{namespace}
Response samples Content type application/json
{ "name" : "my-namespace" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"ownerName" : "me" ,
"description" : "My first namespace!"
}
Deletes a namespace Soft deletes a namespace, and every job and dataset inside it. On the next event containing this namespace, the namespace will be undeleted.
+
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
delete /namespaces/{namespace} http://localhost:5000/api/v1 /namespaces/{namespace}
Response samples Content type application/json
{ "name" : "my-namespace" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"ownerName" : "me" ,
"description" : "My first namespace!"
}
List all namespaces Returns a list of namespaces.
+
query Parameters limit integer
Default: 100
Example: limit=25
The number of results to return from offset.
+
offset integer
Default: 0
The initial position from which to return results.
+
get /namespaces http://localhost:5000/api/v1 /namespaces
Response samples Content type application/json
Copy
Expand all Collapse all { "namespaces" :
[ { "name" : "my-namespace" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"ownerName" : "me" ,
"description" : "My first namespace!"
} ] }
List all received OpenLineage events. Returns a list of OpenLineage events, sorted in the direction given by the sortDirection parameter. The default direction is desc.
+
query Parameters sortDirection string
Example: sortDirection=desc
Sorts the results of your query in the indicated direction: asc
or desc
.
+
before string <date-time>
Example: before=2022-09-15T07:47:19Z
Returns events before the given date.
+
after string <date-time>
Example: after=2022-09-15T07:47:19Z
Returns events after the given date.
+
limit integer
Default: 100
Example: limit=25
The number of results to return from offset.
+
offset integer
Default: 0
The initial position from which to return results.
+
get /events/lineage http://localhost:5000/api/v1 /events/lineage
Response samples Content type application/json
Copy
Expand all Collapse all Create a source Deprecated Creates a new source object. A source is the physical location of a dataset such as a table in PostgreSQL, or topic in Kafka. A source enables the grouping of physical datasets to their physical source.
+
path Parameters source required
string <= 1024 characters
Example: my-source
The name of the source.
+
Request Body schema: application/json
type required
string
The type of the source.
+
connectionUrl required
string <URL>
The URL to the location of the source.
+
description string
The description of the source.
+
put /sources/{source} http://localhost:5000/api/v1 /sources/{source}
Request samples Content type application/json
Response samples Content type application/json
{ "type" : "POSTGRESQL" ,
"name" : "my-source" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"connectionUrl" : "jdbc:postgresql://db.example.com/mydb" ,
"description" : "My first source!"
}
Retrieve a source path Parameters source required
string <= 1024 characters
Example: my-source
The name of the source.
+
get /sources/{source} http://localhost:5000/api/v1 /sources/{source}
Response samples Content type application/json
{ "type" : "POSTGRESQL" ,
"name" : "my-source" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"connectionUrl" : "jdbc:postgresql://db.example.com/mydb" ,
"description" : "My first source!"
}
List all sources Returns a list of sources.
+
query Parameters limit integer
Default: 100
Example: limit=25
The number of results to return from offset.
+
offset integer
Default: 0
The initial position from which to return results.
+
get /sources http://localhost:5000/api/v1 /sources
Response samples Content type application/json
Copy
Expand all Collapse all { "sources" :
[ { "type" : "POSTGRESQL" ,
"name" : "my-source" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"connectionUrl" : "jdbc:postgresql://db.example.com/mydb" ,
"description" : "My first source!"
} ] }
Create a dataset Deprecated path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
dataset required
string <= 1024 characters
Example: my-dataset
The name of the dataset.
+
Request Body schema: application/json
Any of DbTable Stream
type required
string
Value: "DB_TABLE"
The type of the dataset.
+
physicalName required
string
The physical name of the table.
+
sourceName required
string
The name of the source associated with the table.
+
fields required
Array of objects
The fields of the table.
+
tags description string
The description of the table.
+
runId string
The ID associated with the run modifying the table.
+
put /namespaces/{namespace}/datasets/{dataset} http://localhost:5000/api/v1 /namespaces/{namespace}/datasets/{dataset}
Request samples Content type application/json
Copy
Expand all Collapse all { "type" : "DB_TABLE" ,
"physicalName" : "public.mytable" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name" : "a" ,
"type" : "INTEGER"
} ,
{ "name" : "b" ,
"type" : "TIMESTAMP"
} ,
{ "name" : "c" ,
"type" : "INTEGER"
} ,
{ "name" : "d" ,
"type" : "INTEGER"
} ] , "description" : "My first dataset!"
}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"lastModifiedAt" : null ,
"description" : "My first dataset!" ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
}
Retrieve a dataset path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
dataset required
string <= 1024 characters
Example: my-dataset
The name of the dataset.
+
get /namespaces/{namespace}/datasets/{dataset} http://localhost:5000/api/v1 /namespaces/{namespace}/datasets/{dataset}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"lastModifiedAt" : null ,
"description" : "My first dataset!" ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
}
Soft deletes dataset. Soft deletes a dataset. It will be un-deleted if a new OpenLineage event containing this dataset is received.
+
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
dataset required
string <= 1024 characters
Example: my-dataset
The name of the dataset.
+
delete /namespaces/{namespace}/datasets/{dataset} http://localhost:5000/api/v1 /namespaces/{namespace}/datasets/{dataset}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"lastModifiedAt" : null ,
"description" : "My first dataset!" ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
}
Retrieve a version for a dataset Returns a version for a dataset.
+
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
dataset required
string <= 1024 characters
Example: my-dataset
The name of the dataset.
+
version required
string <uuid>
Example: ea9badc5-7cb2-49af-9a9f-155771d3a797
The ID of the job or dataset version.
+
get /namespaces/{namespace}/datasets/{dataset}/versions/{version} http://localhost:5000/api/v1 /namespaces/{namespace}/datasets/{dataset}/versions/{version}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"version" : "d224dac0-35d7-4d9b-bbbe-6fff1a8485ad" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"description" : "My first dataset!" ,
"createdByRun" :
{ "id" : "0e89b60a-d80d-42ae-a12b-bd79ae1fb576" ,
"createdAt" : "2019-05-09T18:52:35.620763Z" ,
"updatedAt" : "2019-05-09T18:53:41.461122Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "COMPLETED" ,
"startedAt" : "2021-02-05T18:53:33.245492Z" ,
"endedAt" : "2021-02-05T18:53:41.461122Z" ,
"durationMs" : 8216 ,
"jobVersion" :
{ "namespace" : "my-namespace" ,
"name" : "my_processing_job" ,
"version" : "0ba5b13b-350e-40f3-ba3f-cc00a4e92d11"
} , "inputVersions" :
[ { "namespace" : "my-namespace" ,
"name" : "an_input_dataset" ,
"version" : "d224dac0-35d7-4d9b-bbbe-6fff1a8485ad"
} ] } }
List all versions for a dataset Returns a list of versions for a dataset.
+
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
dataset required
string <= 1024 characters
Example: my-dataset
The name of the dataset.
+
query Parameters limit integer
Default: 100
Example: limit=25
The number of results to return from offset.
+
offset integer
Default: 0
The initial position from which to return results.
+
get /namespaces/{namespace}/datasets/{dataset}/versions http://localhost:5000/api/v1 /namespaces/{namespace}/datasets/{dataset}/versions
Response samples Content type application/json
Copy
Expand all Collapse all { "versions" :
[ { "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"version" : "d224dac0-35d7-4d9b-bbbe-6fff1a8485ad" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"description" : "My first dataset!" ,
"createdByRun" :
{ "id" : "0e89b60a-d80d-42ae-a12b-bd79ae1fb576" ,
"createdAt" : "2019-05-09T18:52:35.620763Z" ,
"updatedAt" : "2019-05-09T18:53:41.461122Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "COMPLETED" ,
"startedAt" : "2021-02-05T18:53:33.245492Z" ,
"endedAt" : "2021-02-05T18:53:41.461122Z" ,
"durationMs" : 8216 ,
"jobVersion" :
{ "namespace" : "my-namespace" ,
"name" : "my_processing_job" ,
"version" : "0ba5b13b-350e-40f3-ba3f-cc00a4e92d11"
} , "inputVersions" :
[ { "namespace" : "my-namespace" ,
"name" : "an_input_dataset" ,
"version" : "d224dac0-35d7-4d9b-bbbe-6fff1a8485ad"
} ] } } ] }
List all datasets Returns a list of datasets.
+
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
dataset required
string <= 1024 characters
Example: my-dataset
The name of the dataset.
+
query Parameters limit integer
Default: 100
Example: limit=25
The number of results to return from offset.
+
offset integer
Default: 0
The initial position from which to return results.
+
get /namespaces/{namespace}/datasets http://localhost:5000/api/v1 /namespaces/{namespace}/datasets
Response samples Content type application/json
Copy
Expand all Collapse all { "datasets" :
[ { "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"lastModifiedAt" : null ,
"description" : "My first dataset!" ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
} ] , "totalCount" : 0
}
Tag a dataset Tag an existing dataset.
+
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
dataset required
string <= 1024 characters
Example: my-dataset
The name of the dataset.
+
tag required
string
Example: SENSITIVE
post /namespaces/{namespace}/datasets/{dataset}/tags/{tag} http://localhost:5000/api/v1 /namespaces/{namespace}/datasets/{dataset}/tags/{tag}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"lastModifiedAt" : null ,
"description" : "My first dataset!" ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
}
Tag a field Tag an existing field of a dataset.
+
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
dataset required
string <= 1024 characters
Example: my-dataset
The name of the dataset.
+
field required
tag required
string
Example: SENSITIVE
post /namespaces/{namespace}/datasets/{dataset}/fields/{field}/tags/{tag} http://localhost:5000/api/v1 /namespaces/{namespace}/datasets/{dataset}/fields/{field}/tags/{tag}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"lastModifiedAt" : null ,
"description" : "My first dataset!" ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
}
Create a job Deprecated Creates a new job object. All job objects are immutable and are uniquely identified by a generated ID. Marquez will create a version of a job each time the contents of the object are modified. For example, the location
of a job may change over time, resulting in new versions. The accumulated versions can be listed, used to rerun a specific job version, or possibly help debug a failed job run.
+
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
job required
string <= 1024 characters
Example: my-job
Request Body schema: application/json
id type required
string (JobType)
Enum: "BATCH" "STREAM" "SERVICE"
inputs required
Array of objects (DatasetId) unique
The set of input datasets.
+
outputs required
Array of objects (DatasetId) unique
The set of output datasets.
+
location string <URL>
The URL of the job source code or artifact.
+
context object
Deprecated
A key/value pair that must be of type string
. A context can be used for getting additional details about the job.
+
description string
The description of the job.
+
runId string
An optional run ID used to associate a job version to an existing job run.
+
put /namespaces/{namespace}/jobs/{job} http://localhost:5000/api/v1 /namespaces/{namespace}/jobs/{job}
Request samples Content type application/json
Copy
Expand all Collapse all Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "BATCH" ,
"name" : "my-job" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"outputs" : [ ] ,
"description" : "My first job!" ,
"latestRun" : null ,
"latestRuns" : [ ] ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
}
Retrieve a job path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
job required
string <= 1024 characters
Example: my-job
get /namespaces/{namespace}/jobs/{job} http://localhost:5000/api/v1 /namespaces/{namespace}/jobs/{job}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "BATCH" ,
"name" : "my-job" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"outputs" : [ ] ,
"description" : "My first job!" ,
"latestRun" : null ,
"latestRuns" : [ ] ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
}
Soft deletes job. Soft deletes a job. It will be un-deleted if a new OpenLineage event containing this job is received.
+
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
job required
string <= 1024 characters
Example: my-job
delete /namespaces/{namespace}/jobs/{job} http://localhost:5000/api/v1 /namespaces/{namespace}/jobs/{job}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "BATCH" ,
"name" : "my-job" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"outputs" : [ ] ,
"description" : "My first job!" ,
"latestRun" : null ,
"latestRuns" : [ ] ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
}
List all jobs Returns a list of jobs.
+
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
query Parameters limit integer
Default: 100
Example: limit=25
The number of results to return from offset.
+
offset integer
Default: 0
The initial position from which to return results.
+
get /namespaces/{namespace}/jobs http://localhost:5000/api/v1 /namespaces/{namespace}/jobs
Response samples Content type application/json
Copy
Expand all Collapse all { "jobs" :
[ { "type" : "BATCH" ,
"name" : "my-job" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"outputs" : [ ] ,
"description" : "My first job!" ,
"latestRun" : null ,
"latestRuns" : [ ] ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
} ] , "totalCount" : 0
}
Retrieve a version for a job Returns a version for a job.
+
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
job required
string <= 1024 characters
Example: my-job
version required
string <uuid>
Example: ea9badc5-7cb2-49af-9a9f-155771d3a797
The ID of the job or dataset version.
+
get /namespaces/{namespace}/jobs/{job}/versions/{version} http://localhost:5000/api/v1 /namespaces/{namespace}/jobs/{job}/versions/{version}
Response samples Content type application/json
Copy
Expand all Collapse all { "type" : "BATCH" ,
"name" : "my-job" ,
"version" : "56472c57-a2ef-4218-b7b7-d2af02a343fd" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"outputs" : [ ] ,
"description" : "My first job!" ,
"facets" : { }
}
List all versions for a job Returns a list of versions for a job.
+
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
job required
string <= 1024 characters
Example: my-job
get /namespaces/{namespace}/jobs/{job}/versions http://localhost:5000/api/v1 /namespaces/{namespace}/jobs/{job}/versions
Response samples Content type application/json
Copy
Expand all Collapse all { "versions" :
[ { "type" : "BATCH" ,
"name" : "my-job" ,
"version" : "56472c57-a2ef-4218-b7b7-d2af02a343fd" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"outputs" : [ ] ,
"description" : "My first job!" ,
"facets" : { }
} ] }
Create a run Deprecated Creates a new run object for a job.
+
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
job required
string <= 1024 characters
Example: my-job
Request Body schema: application/json
id string <uuid>
An optional user-provided unique ID of the run. A run ID must be a UUID. If an ID for the run is not provided, a random UUID will be generated for the given run.
+
nominalStartTime string <date-time>
An ISO-8601 timestamp representing the nominal start time of the run.
+
nominalEndTime string <date-time>
An ISO-8601 timestamp representing the nominal end time of the run.
+
args object
The arguments of the run.
+
post /namespaces/{namespace}/jobs/{job}/runs http://localhost:5000/api/v1 /namespaces/{namespace}/jobs/{job}/runs
Request samples Content type application/json
Copy
Expand all Collapse all Response samples Content type application/json
Example IncompleteRun IncompleteRun Copy
Expand all Collapse all { "id" : "870492da-ecfb-4be0-91b9-9a89ddd3db90" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "RUNNING" ,
"startedAt" : "2019-05-09T15:17:32.690346" ,
"endedAt" : null ,
"durationMs" : null ,
"args" :
{ "email" : "me@example.com" ,
"emailOnFailure" : "false" ,
"emailOnRetry" : "true" ,
"retries" : "1"
} , "facets" : { }
}
List all runs Returns a list of runs for a job.
+
path Parameters namespace required
string <= 1024 characters
Example: my-namespace
The name of the namespace.
+
job required
string <= 1024 characters
Example: my-job
query Parameters limit integer
Default: 100
Example: limit=25
The number of results to return from offset.
+
offset integer
Default: 0
The initial position from which to return results.
+
get /namespaces/{namespace}/jobs/{job}/runs http://localhost:5000/api/v1 /namespaces/{namespace}/jobs/{job}/runs
Response samples Content type application/json
Copy
Expand all Collapse all { "runs" :
[ { "id" : "870492da-ecfb-4be0-91b9-9a89ddd3db90" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "COMPLETED" ,
"startedAt" : "2019-05-09T15:17:32.690346" ,
"endedAt" : "2019-05-09T20:05:46.815920Z" ,
"durationMs" : 4250894125 ,
"args" :
{ "email" : "me@example.com" ,
"emailOnFailure" : "false" ,
"emailOnRetry" : "true" ,
"retries" : "1"
} , "facets" : { }
} ] }
Retrieve a run path Parameters id required
string <uuid>
Example: ea9badc5-7cb2-49af-9a9f-155771d3a797
get /jobs/runs/{id} http://localhost:5000/api/v1 /jobs/runs/{id}
Response samples Content type application/json
Example IncompleteRun IncompleteRun Copy
Expand all Collapse all { "id" : "870492da-ecfb-4be0-91b9-9a89ddd3db90" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "RUNNING" ,
"startedAt" : "2019-05-09T15:17:32.690346" ,
"endedAt" : null ,
"durationMs" : null ,
"args" :
{ "email" : "me@example.com" ,
"emailOnFailure" : "false" ,
"emailOnRetry" : "true" ,
"retries" : "1"
} , "facets" : { }
}
Retrieve run or job facets for a run. Retrieve run or job facets for a run.
+
path Parameters id required
string <uuid>
Example: ea9badc5-7cb2-49af-9a9f-155771d3a797
query Parameters type required
string
Enum: "run" "job"
Indicates whether job or run facets should be returned.
+
get /jobs/runs/{id}/facets http://localhost:5000/api/v1 /jobs/runs/{id}/facets
Response samples Content type application/json
Copy
Expand all Collapse all Start a run Deprecated Marks the run as RUNNING
.
+
path Parameters id required
string <uuid>
Example: ea9badc5-7cb2-49af-9a9f-155771d3a797
query Parameters at string <date-time>
An ISO-8601 timestamp representing the time when the run transitioned.
+
post /jobs/runs/{id}/start http://localhost:5000/api/v1 /jobs/runs/{id}/start
Response samples Content type application/json
Copy
Expand all Collapse all { "id" : "870492da-ecfb-4be0-91b9-9a89ddd3db90" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "RUNNING" ,
"startedAt" : "2019-05-09T15:17:32.690346" ,
"endedAt" : null ,
"durationMs" : null ,
"args" :
{ "email" : "me@example.com" ,
"emailOnFailure" : "false" ,
"emailOnRetry" : "true" ,
"retries" : "1"
} , "facets" : { }
}
Complete a run Deprecated Marks the run as COMPLETED.
+
path Parameters id required
string <uuid>
Example: ea9badc5-7cb2-49af-9a9f-155771d3a797
query Parameters at string <date-time>
An ISO-8601 timestamp representing the time when the run transitioned.
+
post /jobs/runs/{id}/complete http://localhost:5000/api/v1 /jobs/runs/{id}/complete
Response samples Content type application/json
Example IncompleteRun IncompleteRun Copy
Expand all Collapse all { "id" : "870492da-ecfb-4be0-91b9-9a89ddd3db90" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "RUNNING" ,
"startedAt" : "2019-05-09T15:17:32.690346" ,
"endedAt" : null ,
"durationMs" : null ,
"args" :
{ "email" : "me@example.com" ,
"emailOnFailure" : "false" ,
"emailOnRetry" : "true" ,
"retries" : "1"
} , "facets" : { }
}
Fail a run Deprecated Marks the run as FAILED.
+
path Parameters id required
string <uuid>
Example: ea9badc5-7cb2-49af-9a9f-155771d3a797
query Parameters at string <date-time>
An ISO-8601 timestamp representing the time when the run transitioned.
+
post /jobs/runs/{id}/fail http://localhost:5000/api/v1 /jobs/runs/{id}/fail
Response samples Content type application/json
Copy
Expand all Collapse all { "id" : "870492da-ecfb-4be0-91b9-9a89ddd3db90" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "RUNNING" ,
"startedAt" : "2019-05-09T15:17:32.690346" ,
"endedAt" : null ,
"durationMs" : null ,
"args" :
{ "email" : "me@example.com" ,
"emailOnFailure" : "false" ,
"emailOnRetry" : "true" ,
"retries" : "1"
} , "facets" : { }
}
Abort a run Deprecated Marks the run as ABORTED.
+
path Parameters id required
string <uuid>
Example: ea9badc5-7cb2-49af-9a9f-155771d3a797
query Parameters at string <date-time>
An ISO-8601 timestamp representing the time when the run transitioned.
+
post /jobs/runs/{id}/abort http://localhost:5000/api/v1 /jobs/runs/{id}/abort
Response samples Content type application/json
Copy
Expand all Collapse all { "id" : "870492da-ecfb-4be0-91b9-9a89ddd3db90" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"nominalStartTime" : null ,
"nominalEndTime" : null ,
"state" : "RUNNING" ,
"startedAt" : "2019-05-09T15:17:32.690346" ,
"endedAt" : null ,
"durationMs" : null ,
"args" :
{ "email" : "me@example.com" ,
"emailOnFailure" : "false" ,
"emailOnRetry" : "true" ,
"retries" : "1"
} , "facets" : { }
}
Record a single lineage event Receive, process, and store lineage metadata using the OpenLineage standard.
+
Request Body schema: application/json
post /lineage http://localhost:5000/api/v1 /lineage
Request samples Content type application/json
Copy
Expand all Collapse all Get a lineage graph query Parameters nodeId required
string
Example: nodeId=dataset:food_delivery:public.delivery_7_days
The ID of the node. A node can be a dataset node, a dataset field node, or a job node. The nodeId format for a dataset is dataset:<namespace_of_dataset>:<name_of_the_dataset>, for a dataset field is datasetField:<namespace_of_dataset>:<name_of_the_dataset>:<name_of_field>, and for a job is job:<namespace_of_the_job>:<name_of_the_job>.
+
depth integer
Default: 20
Depth of lineage graph to create.
+
get /lineage http://localhost:5000/api/v1 /lineage
Response samples Content type application/json
Copy
Expand all Collapse all { "graph" :
[ { "id" : "string" ,
"type" : "DATASET" ,
"data" :
{ "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"lastModifiedAt" : null ,
"description" : "My first dataset!" ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
} , "inEdges" :
[ { "origin" : "string" ,
"destination" : "string"
} ] , "outEdges" :
[ { "origin" : "string" ,
"destination" : "string"
} ] } ] }
Get the upstream lineage for a given run get /runlineage/upstream http://localhost:5000/api/v1 /runlineage/upstream
Response samples Content type application/json
Copy
Expand all Collapse all Get a column lineage graph query Parameters nodeId required
string
Example: nodeId=dataset:food_delivery:public.delivery_7_days
The ID of the node. A node can be a dataset node, a dataset field node, or a job node. The nodeId format for a dataset is dataset:<namespace_of_dataset>:<name_of_the_dataset>, for a dataset field is datasetField:<namespace_of_dataset>:<name_of_the_dataset>:<name_of_field>, and for a job is job:<namespace_of_the_job>:<name_of_the_job>.
+
depth integer
Default: 20
Depth of lineage graph to create.
+
withDownstream boolean
Default: false
Determines if downstream lineage should be returned.
+
get /column-lineage http://localhost:5000/api/v1 /column-lineage
Response samples Content type application/json
Copy
Expand all Collapse all { "graph" :
[ { "id" : "string" ,
"type" : "JOB" ,
"data" :
{ "type" : "DB_TABLE" ,
"name" : "my-dataset" ,
"physicalName" : "public.mytable" ,
"createdAt" : "2019-05-09T19:49:24.201361Z" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "my-namespace" ,
"sourceName" : "my-source" ,
"fields" :
[ { "name" : "a" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "b" ,
"type" : "TIMESTAMP" ,
"tags" : [ ]
} ,
{ "name" : "c" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ,
{ "name" : "d" ,
"type" : "INTEGER" ,
"tags" : [ ]
} ] , "tags" : [ ] ,
"lastModifiedAt" : null ,
"description" : "My first dataset!" ,
"facets" : { } ,
"currentVersion" : "b1d626a2-6d3a-475e-9ecf-943176d4a8c6"
} , "inEdges" :
[ { "origin" : "string" ,
"destination" : "string"
} ] , "outEdges" :
[ { "origin" : "string" ,
"destination" : "string"
} ] } ] }
Query all datasets and jobs Returns the datasets and jobs that match your query.
+
query Parameters q required
string
Example: q=my-dataset
Query containing the pattern to match; pattern matching for datasets and jobs is string-based and case-insensitive. Use a percent sign (%) to match any string of zero or more characters (my-job%), or an underscore (_) to match a single character (_job_).
+
filter string
Example: filter=dataset
Filters the results of your query by dataset or job.
+
sort string
Example: sort=name
Sorts the results of your query by name or updated_at.
+
limit integer
Default: 100
Example: limit=25
The number of results to return from offset.
+
namespace string <= 1024 characters
Example: namespace=my-namespace
Match jobs or datasets within the given namespace.
+
before string YYYY-MM-DD
Example: before=2022-09-15
Match jobs or datasets before YYYY-MM-DD.
+
after string YYYY-MM-DD
Example: after=2022-09-15
Match jobs or datasets after YYYY-MM-DD.
+
get /search http://localhost:5000/api/v1 /search
Response samples Content type application/json
Copy
Expand all Collapse all { "totalCount" : 1 ,
"results" :
[ { "type" : "DATASET" ,
"name" : "public.delivery_7_days" ,
"updatedAt" : "2019-05-09T19:49:24.201361Z" ,
"namespace" : "food_delivery" ,
"nodeId" : "dataset:food_delivery:public.delivery_7_days"
} ] }
+
-