-
Notifications
You must be signed in to change notification settings - Fork 1.5k
/
pipeline.yml
69 lines (61 loc) · 1.74 KB
/
pipeline.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
# Azure ML pipeline job spec. `$schema` names the schema this file follows.
$schema: 'https://azuremlschemas.azureedge.net/latest/pipelineJob.schema.json'
type: pipeline
# Name and summary attached to the pipeline job.
display_name: nyc_taxi_data_regression
description: >-
  Train regression model based on nyc taxi dataset
# <inputs_and_outputs>
# Pipeline-level outputs. Jobs in this file bind their own outputs to these
# entries with `${{parent.outputs.<name>}}`.
outputs:
  # Bound to train_job's `model_output`.
  pipeline_job_trained_model:
    type: mlflow_model
    mode: rw_mount
  # Bound to predict_job's `predictions`. No explicit `type` is given here.
  pipeline_job_predictions:
    mode: rw_mount
  # Bound to score_job's `score_report`. No explicit `type` is given here.
  pipeline_job_score_report:
    mode: rw_mount
# </inputs_and_outputs>
# <jobs>
# Pipeline-wide settings: the datastore and compute target named here are the
# defaults for the jobs below, none of which sets its own.
settings:
  default_datastore: azureml:workspaceblobstore
  default_compute: azureml:cpu-cluster
  # NOTE(review): presumably stops the pipeline as soon as one step fails;
  # confirm against the pipeline job schema.
  continue_on_step_failure: false
# Pipeline steps. Data flows prep -> transform -> train -> predict -> score
# through the `${{parent.jobs.<job>.outputs.<name>}}` bindings below.
jobs:
  # Runs the component in ./prep.yml on the local ./data folder.
  prep_job:
    type: command
    component: ./prep.yml
    inputs:
      # Using local data; will create an anonymous data asset.
      raw_data:
        type: uri_folder
        path: ./data
    outputs:
      # Declared with no explicit binding. NOTE(review): presumably the
      # service picks the storage location and mode; confirm in the schema.
      prep_data:

  # Runs the component in ./transform.yml on prep_job's output.
  transform_job:
    type: command
    component: ./transform.yml
    inputs:
      clean_data: ${{parent.jobs.prep_job.outputs.prep_data}}
    outputs:
      # Declared with no explicit binding (see note on prep_data).
      transformed_data:

  # Runs the component in ./train.yml on the transformed data.
  train_job:
    type: command
    component: ./train.yml
    inputs:
      training_data: ${{parent.jobs.transform_job.outputs.transformed_data}}
    outputs:
      # Surfaced as the pipeline-level output `pipeline_job_trained_model`.
      model_output: ${{parent.outputs.pipeline_job_trained_model}}
      # Declared with no explicit binding; consumed by predict_job.
      test_data:

  # Runs the component in ./predict.yml with the trained model and test data.
  predict_job:
    type: command
    component: ./predict.yml
    inputs:
      model_input: ${{parent.jobs.train_job.outputs.model_output}}
      test_data: ${{parent.jobs.train_job.outputs.test_data}}
    outputs:
      # Surfaced as the pipeline-level output `pipeline_job_predictions`.
      predictions: ${{parent.outputs.pipeline_job_predictions}}

  # Runs the component in ./score.yml with the predictions and the model.
  score_job:
    type: command
    component: ./score.yml
    inputs:
      predictions: ${{parent.jobs.predict_job.outputs.predictions}}
      model: ${{parent.jobs.train_job.outputs.model_output}}
    outputs:
      # Surfaced as the pipeline-level output `pipeline_job_score_report`.
      score_report: ${{parent.outputs.pipeline_job_score_report}}
# </jobs>