Commit 287277da authored by Brandon Schoenfeld

added byu-dml primitives and pipelines

parent 48557efa
{
"id": "74f5ccb1-053a-46cf-ad7f-005f67a15652",
"schema": "https://metadata.datadrivendiscovery.org/schemas/v0/pipeline.json",
"created": "2019-04-19T22:18:52.148196Z",
"context": "TESTING",
"inputs": [
{
"name": "inputs"
}
],
"outputs": [
{
"data": "steps.6.produce",
"name": "predictions"
}
],
"steps": [
{
"type": "PRIMITIVE",
"primitive": {
"id": "4b42ce1e-9b98-4a25-b68e-fad13311eb65",
"version": "0.3.0",
"python_path": "d3m.primitives.data_transformation.dataset_to_dataframe.Common",
"name": "Extract a DataFrame from a Dataset",
"digest": "b1c248751b314d78349de9c5590f3e970e1c5514b78a90707f4dc267c4ca7bf1"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "inputs.0"
}
},
"outputs": [
{
"id": "produce"
}
]
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "d510cb7a-1782-4f51-b44c-58f0236e47c7",
"version": "0.5.0",
"python_path": "d3m.primitives.data_transformation.column_parser.DataFrameCommon",
"name": "Parses strings into their types",
"digest": "fd9ba65a05a5fae4ab1536f385656099dbe3b42670e7353124379157bf14803b"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.0.produce"
}
},
"outputs": [
{
"id": "produce"
}
]
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "4503a4c6-42f7-45a1-a1d4-ed69699cf5e1",
"version": "0.2.0",
"python_path": "d3m.primitives.data_transformation.extract_columns_by_semantic_types.DataFrameCommon",
"name": "Extracts columns by semantic type",
"digest": "298167ba6e068fe75d94bfa8793827436e735f0d44551d738da045dc904edf0f"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.1.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"semantic_types": {
"type": "VALUE",
"data": [
"https://metadata.datadrivendiscovery.org/types/Attribute"
]
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "4503a4c6-42f7-45a1-a1d4-ed69699cf5e1",
"version": "0.2.0",
"python_path": "d3m.primitives.data_transformation.extract_columns_by_semantic_types.DataFrameCommon",
"name": "Extracts columns by semantic type",
"digest": "298167ba6e068fe75d94bfa8793827436e735f0d44551d738da045dc904edf0f"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.1.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"semantic_types": {
"type": "VALUE",
"data": [
"https://metadata.datadrivendiscovery.org/types/TrueTarget"
]
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "ebfeb6f0-e366-4082-b1a7-602fd50acc96",
"version": "0.1.4",
"python_path": "d3m.primitives.data_preprocessing.random_sampling_imputer.BYU",
"name": "Random Sampling Imputer",
"digest": "5f808d46ed8e5dace09749455f4e05adc542d3218632919c3307351d59d0da41"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.2.produce"
}
},
"outputs": [
{
"id": "produce"
}
]
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "f0fd7a62-09b5-3abc-93bb-f5f999f7cc80",
"version": "v2019.4.4",
"python_path": "d3m.primitives.regression.random_forest.SKlearn",
"name": "sklearn.ensemble.forest.RandomForestRegressor",
"digest": "d11179cee4ab21f3e6c0308775c5c5d22fc7a07dbceafeb9f86565c52d105765"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.4.produce"
},
"outputs": {
"type": "CONTAINER",
"data": "steps.3.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"use_semantic_types": {
"type": "VALUE",
"data": true
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "8d38b340-f83f-4877-baaa-162f8e551736",
"version": "0.3.0",
"python_path": "d3m.primitives.data_transformation.construct_predictions.DataFrameCommon",
"name": "Construct pipeline predictions output",
"digest": "a16e280fce14ef80dba3035c1dbf0e2571fe7d02acd95b05f2787fd1886484e4"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.5.produce"
},
"reference": {
"type": "CONTAINER",
"data": "steps.0.produce"
}
},
"outputs": [
{
"id": "produce"
}
]
}
],
"digest": "7d70b2e66bf743485b2dfa06e7ca0928cd595714a3912642699b94e7678760c2"
}
\ No newline at end of file
{
"problem": "196_autoMpg_problem",
"full_inputs": [
"196_autoMpg_dataset"
],
"train_inputs": [
"196_autoMpg_dataset_TRAIN"
],
"test_inputs": [
"196_autoMpg_dataset_TEST"
],
"score_inputs": [
"196_autoMpg_dataset_SCORE"
]
}
\ No newline at end of file
{
"id": "f4fe3fcc-45fe-4c85-8845-549e2f466f21",
"schema": "https://metadata.datadrivendiscovery.org/schemas/v0/pipeline.json",
"created": "2019-04-19T22:18:51.691000Z",
"context": "TESTING",
"inputs": [
{
"name": "inputs"
}
],
"outputs": [
{
"data": "steps.6.produce",
"name": "predictions"
}
],
"steps": [
{
"type": "PRIMITIVE",
"primitive": {
"id": "4b42ce1e-9b98-4a25-b68e-fad13311eb65",
"version": "0.3.0",
"python_path": "d3m.primitives.data_transformation.dataset_to_dataframe.Common",
"name": "Extract a DataFrame from a Dataset",
"digest": "b1c248751b314d78349de9c5590f3e970e1c5514b78a90707f4dc267c4ca7bf1"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "inputs.0"
}
},
"outputs": [
{
"id": "produce"
}
]
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "d510cb7a-1782-4f51-b44c-58f0236e47c7",
"version": "0.5.0",
"python_path": "d3m.primitives.data_transformation.column_parser.DataFrameCommon",
"name": "Parses strings into their types",
"digest": "fd9ba65a05a5fae4ab1536f385656099dbe3b42670e7353124379157bf14803b"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.0.produce"
}
},
"outputs": [
{
"id": "produce"
}
]
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "4503a4c6-42f7-45a1-a1d4-ed69699cf5e1",
"version": "0.2.0",
"python_path": "d3m.primitives.data_transformation.extract_columns_by_semantic_types.DataFrameCommon",
"name": "Extracts columns by semantic type",
"digest": "298167ba6e068fe75d94bfa8793827436e735f0d44551d738da045dc904edf0f"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.1.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"semantic_types": {
"type": "VALUE",
"data": [
"https://metadata.datadrivendiscovery.org/types/Attribute"
]
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "4503a4c6-42f7-45a1-a1d4-ed69699cf5e1",
"version": "0.2.0",
"python_path": "d3m.primitives.data_transformation.extract_columns_by_semantic_types.DataFrameCommon",
"name": "Extracts columns by semantic type",
"digest": "298167ba6e068fe75d94bfa8793827436e735f0d44551d738da045dc904edf0f"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.1.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"semantic_types": {
"type": "VALUE",
"data": [
"https://metadata.datadrivendiscovery.org/types/TrueTarget"
]
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "ebfeb6f0-e366-4082-b1a7-602fd50acc96",
"version": "0.1.4",
"python_path": "d3m.primitives.data_preprocessing.random_sampling_imputer.BYU",
"name": "Random Sampling Imputer",
"digest": "5f808d46ed8e5dace09749455f4e05adc542d3218632919c3307351d59d0da41"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.2.produce"
}
},
"outputs": [
{
"id": "produce"
}
]
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "1dd82833-5692-39cb-84fb-2455683075f3",
"version": "v2019.4.4",
"python_path": "d3m.primitives.classification.random_forest.SKlearn",
"name": "sklearn.ensemble.forest.RandomForestClassifier",
"digest": "7ea6cf52c696329ea9270dfc9d1cea219de388b5714ad850c6a055bd9b699ed9"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.4.produce"
},
"outputs": {
"type": "CONTAINER",
"data": "steps.3.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"use_semantic_types": {
"type": "VALUE",
"data": true
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "8d38b340-f83f-4877-baaa-162f8e551736",
"version": "0.3.0",
"python_path": "d3m.primitives.data_transformation.construct_predictions.DataFrameCommon",
"name": "Construct pipeline predictions output",
"digest": "a16e280fce14ef80dba3035c1dbf0e2571fe7d02acd95b05f2787fd1886484e4"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.5.produce"
},
"reference": {
"type": "CONTAINER",
"data": "steps.0.produce"
}
},
"outputs": [
{
"id": "produce"
}
]
}
],
"digest": "371720cc680bbaf6753f813c7c6be96dfeeefa75a505754c7eb13e020140d3f7"
}
\ No newline at end of file
{
"problem": "185_baseball_problem",
"full_inputs": [
"185_baseball_dataset"
],
"train_inputs": [
"185_baseball_dataset_TRAIN"
],
"test_inputs": [
"185_baseball_dataset_TEST"
],
"score_inputs": [
"185_baseball_dataset_SCORE"
]
}
\ No newline at end of file
{
"id": "3013ad40-7c51-4991-b0fb-dbec65607979",
"schema": "https://metadata.datadrivendiscovery.org/schemas/v0/pipeline.json",
"created": "2019-04-19T22:18:52.253052Z",
"context": "TESTING",
"inputs": [
{
"name": "inputs"
}
],
"outputs": [
{
"data": "steps.7.produce",
"name": "predictions"
}
],
"steps": [
{
"type": "PRIMITIVE",
"primitive": {
"id": "4b42ce1e-9b98-4a25-b68e-fad13311eb65",
"version": "0.3.0",
"python_path": "d3m.primitives.data_transformation.dataset_to_dataframe.Common",
"name": "Extract a DataFrame from a Dataset",
"digest": "b1c248751b314d78349de9c5590f3e970e1c5514b78a90707f4dc267c4ca7bf1"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "inputs.0"
}
},
"outputs": [
{
"id": "produce"
}
]
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "d510cb7a-1782-4f51-b44c-58f0236e47c7",
"version": "0.5.0",
"python_path": "d3m.primitives.data_transformation.column_parser.DataFrameCommon",
"name": "Parses strings into their types",
"digest": "fd9ba65a05a5fae4ab1536f385656099dbe3b42670e7353124379157bf14803b"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.0.produce"
}
},
"outputs": [
{
"id": "produce"
}
]
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "28d12214-8cb0-4ac0-8946-d31fcbcd4142",
"version": "0.4.3",
"python_path": "d3m.primitives.metafeature_extraction.meta_feature_extractor.BYU",
"name": "Dataset Metafeature Extraction",
"digest": "aa5e61cbb77cdf73eb24ceeb0dce0892a8580bc8513c0f33dc1a6b230abd427d"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.1.produce"
}
},
"outputs": [
{
"id": "produce"
}
]
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "4503a4c6-42f7-45a1-a1d4-ed69699cf5e1",
"version": "0.2.0",
"python_path": "d3m.primitives.data_transformation.extract_columns_by_semantic_types.DataFrameCommon",
"name": "Extracts columns by semantic type",
"digest": "298167ba6e068fe75d94bfa8793827436e735f0d44551d738da045dc904edf0f"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.1.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"semantic_types": {
"type": "VALUE",
"data": [
"https://metadata.datadrivendiscovery.org/types/Attribute"
]
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "4503a4c6-42f7-45a1-a1d4-ed69699cf5e1",
"version": "0.2.0",
"python_path": "d3m.primitives.data_transformation.extract_columns_by_semantic_types.DataFrameCommon",
"name": "Extracts columns by semantic type",
"digest": "298167ba6e068fe75d94bfa8793827436e735f0d44551d738da045dc904edf0f"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.1.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"semantic_types": {
"type": "VALUE",
"data": [
"https://metadata.datadrivendiscovery.org/types/TrueTarget"
]
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "d016df89-de62-3c53-87ed-c06bb6a23cde",
"version": "v2019.4.4",
"python_path": "d3m.primitives.data_cleaning.imputer.SKlearn",
"name": "sklearn.impute.SimpleImputer",
"digest": "d7d1c2bd5b669ac4a01334504f92f970fab4bb10e62755a2081f843ae8829796"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.3.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"use_semantic_types": {
"type": "VALUE",
"data": true
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "f0fd7a62-09b5-3abc-93bb-f5f999f7cc80",
"version": "v2019.4.4",
"python_path": "d3m.primitives.regression.random_forest.SKlearn",
"name": "sklearn.ensemble.forest.RandomForestRegressor",
"digest": "d11179cee4ab21f3e6c0308775c5c5d22fc7a07dbceafeb9f86565c52d105765"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.5.produce"
},
"outputs": {
"type": "CONTAINER",
"data": "steps.4.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"use_semantic_types": {
"type": "VALUE",
"data": true