Commit 9c47dbda authored by Jarod Wang's avatar Jarod Wang Committed by Sujen

update pipelines

parent 8a1e2508
{
"id": "5fb46f32-7824-4eb4-9446-2a2c6f4254fb",
"schema": "https://metadata.datadrivendiscovery.org/schemas/v0/pipeline.json",
"created": "2019-06-20T14:50:50.855368Z",
"inputs": [
{
"name": "dataset inputs"
}
],
"outputs": [
{
"data": "steps.6.produce",
"name": "output predictions"
}
],
"steps": [
{
"type": "PRIMITIVE",
"primitive": {
"id": "4b42ce1e-9b98-4a25-b68e-fad13311eb65",
"version": "0.3.0",
"python_path": "d3m.primitives.data_transformation.dataset_to_dataframe.Common",
"name": "Extract a DataFrame from a Dataset",
"digest": "45f8322097914f9c95c4f9a8224d02db5d79b7166c74115e2eea7b23ccc13510"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "inputs.0"
}
},
"outputs": [
{
"id": "produce"
}
]
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "d510cb7a-1782-4f51-b44c-58f0236e47c7",
"version": "0.5.0",
"python_path": "d3m.primitives.data_transformation.column_parser.DataFrameCommon",
"name": "Parses strings into their types",
"digest": "d41ad0c56ef55a233b21f4a4d8df1ac782aca7a78ef98dbfb72215690b3e9850"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.0.produce"
}
},
"outputs": [
{
"id": "produce"
}
]
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "4503a4c6-42f7-45a1-a1d4-ed69699cf5e1",
"version": "0.3.0",
"python_path": "d3m.primitives.data_transformation.extract_columns_by_semantic_types.DataFrameCommon",
"name": "Extracts columns by semantic type",
"digest": "e91e0f7569ad53b6d4b8c01641f80fb0aa764b5dd3ae71dd2fbb433fa62c7f81"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.1.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"semantic_types": {
"type": "VALUE",
"data": [
"https://metadata.datadrivendiscovery.org/types/Attribute"
]
},
"exclude_columns": {
"type": "VALUE",
"data": [
1,
2,
3,
4,
5,
20,
21,
22,
23,
27
]
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "f410b951-1cb6-481c-8d95-2d97b31d411d",
"version": "3.0.1",
"python_path": "d3m.primitives.natural_language_processing.lda.Fastlvm",
"name": "Latent Dirichlet Allocation Topic Modelling",
"digest": "39c99a619277e94a465e579574a5002dd0ee7cc996b8f0fe7a2aa063881b42b7"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.2.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"k": {
"type": "VALUE",
"data": 100
},
"iters": {
"type": "VALUE",
"data": 100
},
"frac": {
"type": "VALUE",
"data": 0.001
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "4503a4c6-42f7-45a1-a1d4-ed69699cf5e1",
"version": "0.3.0",
"python_path": "d3m.primitives.data_transformation.extract_columns_by_semantic_types.DataFrameCommon",
"name": "Extracts columns by semantic type",
"digest": "e91e0f7569ad53b6d4b8c01641f80fb0aa764b5dd3ae71dd2fbb433fa62c7f81"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.1.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"semantic_types": {
"type": "VALUE",
"data": [
"https://metadata.datadrivendiscovery.org/types/TrueTarget"
]
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "84f39131-6618-4d90-9590-b79d41dfb093",
"version": "2.2.1",
"python_path": "d3m.primitives.classification.search.Find_projections",
"name": "find projections",
"digest": "b7241a4d0044369436fd6a7d16650b67fb73811e68b1704a6d2b59034e0c3242"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.3.produce"
},
"outputs": {
"type": "CONTAINER",
"data": "steps.4.produce"
}
},
"outputs": [
{
"id": "produce"
}
]
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "8d38b340-f83f-4877-baaa-162f8e551736",
"version": "0.3.0",
"python_path": "d3m.primitives.data_transformation.construct_predictions.DataFrameCommon",
"name": "Construct pipeline predictions output",
"digest": "53087aaa6baf0ccc96b6525ca5b79fd4e51b4cce996ab39773a9b0b3e746bf05"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.5.produce"
},
"reference": {
"type": "CONTAINER",
"data": "steps.0.produce"
}
},
"outputs": [
{
"id": "produce"
}
]
}
],
"digest": "5f4686530961dcee41f75cee332f68f3b61d37f919cb3f196021dea57ad5fcf8"
}
\ No newline at end of file
{
"problem": "LL0_acled_reduced_problem",
"full_inputs": [
"LL0_acled_reduced_dataset"
],
"train_inputs": [
"LL0_acled_reduced_dataset_TRAIN"
],
"test_inputs": [
"LL0_acled_reduced_dataset_TEST"
],
"score_inputs": [
"LL0_acled_reduced_dataset_SCORE"
]
}
\ No newline at end of file
{
"id": "9f557bc3-8160-46b8-bd27-17b2284e92f0",
"schema": "https://metadata.datadrivendiscovery.org/schemas/v0/pipeline.json",
"created": "2019-06-20T15:45:35.800944Z",
"inputs": [
{
"name": "dataset inputs"
}
],
"outputs": [
{
"data": "steps.6.produce",
"name": "output predictions"
}
],
"steps": [
{
"type": "PRIMITIVE",
"primitive": {
"id": "4b42ce1e-9b98-4a25-b68e-fad13311eb65",
"version": "0.3.0",
"python_path": "d3m.primitives.data_transformation.dataset_to_dataframe.Common",
"name": "Extract a DataFrame from a Dataset",
"digest": "45f8322097914f9c95c4f9a8224d02db5d79b7166c74115e2eea7b23ccc13510"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "inputs.0"
}
},
"outputs": [
{
"id": "produce"
}
]
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "d510cb7a-1782-4f51-b44c-58f0236e47c7",
"version": "0.5.0",
"python_path": "d3m.primitives.data_transformation.column_parser.DataFrameCommon",
"name": "Parses strings into their types",
"digest": "d41ad0c56ef55a233b21f4a4d8df1ac782aca7a78ef98dbfb72215690b3e9850"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.0.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"parse_semantic_types": {
"type": "VALUE",
"data": [
"http://schema.org/Integer",
"http://schema.org/Float"
]
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "4503a4c6-42f7-45a1-a1d4-ed69699cf5e1",
"version": "0.3.0",
"python_path": "d3m.primitives.data_transformation.extract_columns_by_semantic_types.DataFrameCommon",
"name": "Extracts columns by semantic type",
"digest": "e91e0f7569ad53b6d4b8c01641f80fb0aa764b5dd3ae71dd2fbb433fa62c7f81"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.1.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"semantic_types": {
"type": "VALUE",
"data": [
"http://schema.org/Integer",
"http://schema.org/Float"
]
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "d016df89-de62-3c53-87ed-c06bb6a23cde",
"version": "2019.6.7",
"python_path": "d3m.primitives.data_cleaning.imputer.SKlearn",
"name": "sklearn.impute.SimpleImputer",
"digest": "d6902b0ef72b4cd6fc5f79054f7a534404c708e1244e94a2713a9dd525c78eed"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.2.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"use_semantic_types": {
"type": "VALUE",
"data": true
},
"return_result": {
"type": "VALUE",
"data": "replace"
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "4503a4c6-42f7-45a1-a1d4-ed69699cf5e1",
"version": "0.3.0",
"python_path": "d3m.primitives.data_transformation.extract_columns_by_semantic_types.DataFrameCommon",
"name": "Extracts columns by semantic type",
"digest": "e91e0f7569ad53b6d4b8c01641f80fb0aa764b5dd3ae71dd2fbb433fa62c7f81"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.1.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"semantic_types": {
"type": "VALUE",
"data": [
"https://metadata.datadrivendiscovery.org/types/TrueTarget"
]
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "84f39131-6618-4d90-9590-b79d41dfb093",
"version": "2.2.1",
"python_path": "d3m.primitives.classification.search.Find_projections",
"name": "find projections",
"digest": "b7241a4d0044369436fd6a7d16650b67fb73811e68b1704a6d2b59034e0c3242"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.3.produce"
},
"outputs": {
"type": "CONTAINER",
"data": "steps.4.produce"
}
},
"outputs": [
{
"id": "produce"
}
]
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "8d38b340-f83f-4877-baaa-162f8e551736",
"version": "0.3.0",
"python_path": "d3m.primitives.data_transformation.construct_predictions.DataFrameCommon",
"name": "Construct pipeline predictions output",
"digest": "53087aaa6baf0ccc96b6525ca5b79fd4e51b4cce996ab39773a9b0b3e746bf05"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.5.produce"
},
"reference": {
"type": "CONTAINER",
"data": "steps.0.produce"
}
},
"outputs": [
{
"id": "produce"
}
]
}
],
"digest": "d385b0087fe3b0698622804d0a24108873b2f6766ec4e0cbc835c4ecad366848"
}
\ No newline at end of file
{
"problem": "1491_one_hundred_plants_margin_problem",
"full_inputs": [
"1491_one_hundred_plants_margin_dataset"
],
"train_inputs": [
"1491_one_hundred_plants_margin_dataset_TRAIN"
],
"test_inputs": [
"1491_one_hundred_plants_margin_dataset_TEST"
],
"score_inputs": [
"1491_one_hundred_plants_margin_dataset_SCORE"
]
}
\ No newline at end of file
{
"id": "b1ac84e3-32ef-4ae3-ade9-6e91547f0232",
"schema": "https://metadata.datadrivendiscovery.org/schemas/v0/pipeline.json",
"created": "2019-06-20T15:41:01.902934Z",
"inputs": [
{
"name": "dataset inputs"
}
],
"outputs": [
{
"data": "steps.7.produce",
"name": "output predictions"
}
],
"steps": [
{
"type": "PRIMITIVE",
"primitive": {
"id": "4b42ce1e-9b98-4a25-b68e-fad13311eb65",
"version": "0.3.0",
"python_path": "d3m.primitives.data_transformation.dataset_to_dataframe.Common",
"name": "Extract a DataFrame from a Dataset",
"digest": "45f8322097914f9c95c4f9a8224d02db5d79b7166c74115e2eea7b23ccc13510"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "inputs.0"
}
},
"outputs": [
{
"id": "produce"
}
]
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "d510cb7a-1782-4f51-b44c-58f0236e47c7",
"version": "0.5.0",
"python_path": "d3m.primitives.data_transformation.column_parser.DataFrameCommon",
"name": "Parses strings into their types",
"digest": "d41ad0c56ef55a233b21f4a4d8df1ac782aca7a78ef98dbfb72215690b3e9850"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.0.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"parse_semantic_types": {
"type": "VALUE",
"data": [
"http://schema.org/Integer",
"http://schema.org/Float"
]
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "4503a4c6-42f7-45a1-a1d4-ed69699cf5e1",
"version": "0.3.0",
"python_path": "d3m.primitives.data_transformation.extract_columns_by_semantic_types.DataFrameCommon",
"name": "Extracts columns by semantic type",
"digest": "e91e0f7569ad53b6d4b8c01641f80fb0aa764b5dd3ae71dd2fbb433fa62c7f81"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.1.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"semantic_types": {
"type": "VALUE",
"data": [
"https://metadata.datadrivendiscovery.org/types/Attribute"
]
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "4503a4c6-42f7-45a1-a1d4-ed69699cf5e1",
"version": "0.3.0",
"python_path": "d3m.primitives.data_transformation.extract_columns_by_semantic_types.DataFrameCommon",
"name": "Extracts columns by semantic type",
"digest": "e91e0f7569ad53b6d4b8c01641f80fb0aa764b5dd3ae71dd2fbb433fa62c7f81"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.1.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"semantic_types": {
"type": "VALUE",
"data": [
"https://metadata.datadrivendiscovery.org/types/TrueTarget"
]
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "c977e879-1bf5-3829-b5b0-39b00233aff5",
"version": "2019.6.7",
"python_path": "d3m.primitives.data_transformation.one_hot_encoder.SKlearn",
"name": "sklearn.preprocessing.data.OneHotEncoder",
"digest": "24da929ef41fa43ca4a50c1b99d97733cb2b0bebb33ab8f82ebdc16cf7675524"
},
"arguments": {
"inputs": {
"type": "CONTAINER",
"data": "steps.2.produce"
}
},
"outputs": [
{
"id": "produce"
}
],
"hyperparams": {
"use_semantic_types": {
"type": "VALUE",
"data": true
},
"return_result": {
"type": "VALUE",
"data": "replace"
},
"handle_unknown": {
"type": "VALUE",
"data": "ignore"
}
}
},
{
"type": "PRIMITIVE",
"primitive": {
"id": "854727ed-c82c-3137-ac59-fd52bc9ba385",
"version": "2019.6.7",