Commit c287f68d authored by Mitar

New version of common primitives.

parent b2933b97
......@@ -18,7 +18,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common-primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common-primitives"
}
],
"algorithm_types": [
......@@ -622,5 +622,5 @@
},
"structural_type": "common_primitives.lgbm_classifier.LightGBMClassifierPrimitive",
"description": "A lightGBM classifier using ``lgbm.LGBMClassifier``.\n\nIt uses semantic types to determine which columns to operate on.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "b1af2f5c142e1d4c9bbda7f8eced4586777aab58339918d3712e931334cf8fae"
"digest": "efb1d7bd23c42e987d4a6fbb4764c93fd13814c0a19b18a2b3c06cd1c1f9eee4"
}
......@@ -18,7 +18,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common-primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common-primitives"
}
],
"algorithm_types": [
......@@ -648,5 +648,5 @@
},
"structural_type": "common_primitives.random_forest.RandomForestClassifierPrimitive",
"description": "A random forest classifier using ``sklearn.ensemble.forest.RandomForestClassifier``.\n\nIt uses semantic types to determine which columns to operate on.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "a4cdc23120dbf003528b26c405e2dac56b356e4eacc8ccb3f003aa69c0d10562"
"digest": "8217a2914b50260e829441d95e047ffc2876f4195e2ff15bb7e0e5854aab066f"
}
......@@ -18,7 +18,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common-primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common-primitives"
}
],
"algorithm_types": [
......@@ -664,5 +664,5 @@
},
"structural_type": "common_primitives.xgboost_dart.XGBoostDartClassifierPrimitive",
"description": "A XGBoost classifier using ``xgb.XGBoostClassifier`` with Dart Boosting type.\n\nIt uses semantic types to determine which columns to operate on.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "2118164cce45c0c5502bdd5b29e17d87c98cb008e72b8f41d1395c86feab3ea6"
"digest": "1294d522eac6259ab4f254ed15000a816bb1537d0556b27ebf7c686f4a2e4010"
}
......@@ -18,7 +18,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common-primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common-primitives"
}
],
"algorithm_types": [
......@@ -625,5 +625,5 @@
},
"structural_type": "common_primitives.xgboost_gbtree.XGBoostGBTreeClassifierPrimitive",
"description": "A XGBoost classifier using ``xgb.XGBoostClassifier`` with GBTree Boosting type.\n\nIt uses semantic types to determine which columns to operate on.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "81b1a7044183501031d8442bccea50751a8f1ce1ad7f94ef17f4e5a702054937"
"digest": "cc13bca601923fb7fa00855c12b7e42b72777242c74c4e864d843a99346f0649"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -228,5 +228,5 @@
},
"structural_type": "common_primitives.datamart_augment.DataMartAugmentPrimitive",
"description": "Augment supplied dataset with additional columns.\n\nUse ``DATAMART_NYU_URL`` and ``DATAMART_ISI_URL`` environment variables to control where\ncan the primitive connect to respective DataMarts.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "6ec50b4cfaef6a751ab2a3cb67b618bd778d07fa02efc86d447b874e73a8bf9e"
"digest": "37c867c5c53e40d34b725d97bafb00fb816987f8d224c74412e7256a93f94fa3"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -203,5 +203,5 @@
},
"structural_type": "common_primitives.datamart_download.DataMartDownloadPrimitive",
"description": "Download a dataset from DataMart.\n\nUse ``DATAMART_NYU_URL`` and ``DATAMART_ISI_URL`` environment variables to control where\ncan the primitive connect to respective DataMarts.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "efe7739e67e09a79952da8fbc00fdde111ded1d57a6ad22db48aab87513e6cbe"
"digest": "c0246225ec2e069ab810666e5d8091e741f5eb25ab50eec73419c6904e6ca9e9"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common-primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common-primitives"
}
],
"algorithm_types": [
......@@ -211,5 +211,5 @@
},
"structural_type": "common_primitives.tabular_extractor.AnnotatedTabularExtractorPrimitive",
"description": "A primitive wrapping for MIT-LL slacker's ``AnnotatedTabularExtractor``.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "45f1a2ecb61e3249a7edabcf73fd28f37dd90ad491ba04a50c420aeb267bc64e"
"digest": "6d3199ef33f04862ef694c6b9046fd316b91d69d95d7997e4150f00489524f27"
}
......@@ -43,7 +43,7 @@
},
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -261,5 +261,5 @@
},
"structural_type": "common_primitives.audio_reader.AudioReaderPrimitive",
"description": "A primitive which reads columns referencing audio files.\n\nEach column which has ``https://metadata.datadrivendiscovery.org/types/FileName`` semantic type\nand a valid media type (``audio/aiff``, ``audio/flac``, ``audio/ogg``, ``audio/wav``, ``audio/mpeg``)\nhas every filename read into an audio represented as a numpy array. By default the resulting column\nwith read arrays is appended to existing columns.\n\nThe shape of numpy arrays is S x C. S is the number of samples, C is the number of\nchannels in an audio (e.g., C = 1 for mono, C = 2 for stereo). dtype is float32.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "0b640ad037c928dd0a36255ef5c8718576c4cad773470d07e5214cbac1eee696"
"digest": "683e9d72a38dc42cb854231af50442b8fa238b78eadce091303d9f29eb4b50a0"
}
......@@ -18,7 +18,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -232,5 +232,5 @@
},
"structural_type": "common_primitives.csv_reader.CSVReaderPrimitive",
"description": "A primitive which reads columns referencing CSV files.\n\nEach column which has ``https://metadata.datadrivendiscovery.org/types/FileName`` semantic type\nand a valid media type (``text/csv``) has every filename read as a pandas DataFrame. By default\nthe resulting column with read pandas DataFrames is appended to existing columns.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "9331fcf4c91e5f4d77b22abc9a0c314d230af1f726e5ac03db102cf57a3f4f97"
"digest": "3238b4371c791a29afcee675ff4027f2f0922505469e1f974283724e7931d420"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -266,5 +266,5 @@
},
"structural_type": "common_primitives.datetime_range_filter.DatetimeRangeFilterPrimitive",
"description": "A primitive which filters rows from a DataFrame based on a datetime range applied to a given column.\nColumns are identified by their index, and the filter itself can be inclusive (values within range are retained)\nor exclusive (values within range are removed). Boundaries values can be included in the filter (ie. <=) or excluded\n(ie. <).\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "e4a717dc91b2be3eb886615bc6668c0e09a1a40a58c4abfa75b254372602fd80"
"digest": "03896c6e9b8dd5d81248e9d299255ac6019da3e947b8ad27d2d4f920ecdc3f04"
}
......@@ -18,7 +18,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -262,5 +262,5 @@
},
"structural_type": "common_primitives.dataframe_flatten.DataFrameFlattenPrimitive",
"description": "Cycles through the input dataframe and flattens the encountered nested structures (series & dataframes).\nFlattening involves creating a new row for each nested data row, and replicating the unnested row features.\n[\n a, b, [w, x],\n c, d, [y, z],\n]\n\nyields:\n\n[\n a, b, w,\n a, b, x,\n c, d, y,\n c, d, z\n]\n\nIf the d3m index field is present and set as index, it will be updated to be multi index\nas needed. The primitive should be called after the referenced files have\nalready been nested in the dataframe (using the CSVReader primitive for example). The primitive can\nflatten mutiple nested columns, but is currently limited to supporting a nesting depth of 1.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "d4f0d2e28ee4f83ecff11e46e3e2ccdbd0af23908453ef7d51d9827b860a1202"
"digest": "94c6dd0b0c30bf364da943f42998c5233ffda0734c2301dba3885b1b45e0e64a"
}
......@@ -20,7 +20,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -235,5 +235,5 @@
},
"structural_type": "common_primitives.dataframe_image_reader.DataFrameImageReaderPrimitive",
"description": "A primitive which reads columns referencing image files.\n\nEach column which has ``https://metadata.datadrivendiscovery.org/types/FileName`` semantic type\nand a valid media type (``image/jpeg``, ``image/png``) has every filename read into an image\nrepresented as a numpy array. By default the resulting column with read arrays is appended\nto existing columns.\n\nThe shape of numpy arrays is H x W x C. C is the number of channels in an image\n(e.g., C = 1 for greyscale, C = 3 for RGB), H is the height, and W is the width.\ndtype is uint8.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "4d08472cb2054e39e07bb0fc377fdfc971517e55beed48f4db6c64276694cad6"
"digest": "1c7453b0d46b0928e707f68fcb7e44500335240d2263b5a9518023badbee015a"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common-primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common-primitives"
}
],
"algorithm_types": [
......@@ -262,5 +262,5 @@
},
"structural_type": "common_primitives.unseen_label_decoder.UnseenLabelDecoderPrimitive",
"description": "A primitive which inverses the label encoding by ``UnseenLabelEncoderPrimitive``.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "80c99c8068f6e8613f55eb07edb743d68360c3d03a4f2e9fb003efbf3c61f8d7"
"digest": "6f3074584102aad657248655b342b80114fef0adb001cfdb2a6cf05757461f2c"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common-primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common-primitives"
}
],
"algorithm_types": [
......@@ -240,5 +240,5 @@
},
"structural_type": "common_primitives.unseen_label_encoder.UnseenLabelEncoderPrimitive",
"description": "Label encoder that can puts any unseen categories into a single category.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "ca16dad447c1d670e04a33456925c70f121c79c461da053fba4c4ca4de072cf6"
"digest": "efee5468b4cabf6cd29f576e417e41a3f615b3c7300d1078570173083b3cf3c7"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -266,5 +266,5 @@
},
"structural_type": "common_primitives.numeric_range_filter.NumericRangeFilterPrimitive",
"description": "A primitive which filters rows from a DataFrame based on a numeric range applied to a given column.\nColumns are identified by their index, and the filter itself can be inclusive (values within range are retained)\nor exclusive (values within range are removed). Boundaries values can be included in the filter (ie. <=) or excluded\n(ie. <).\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "4de632567b17ff3c9b6defbc95496ee6ec1ea1b324138d78928a5f55d85d53be"
"digest": "04c76d6ec5aad5b47b29c4198d8aa5085f88fe4636fae63d9f7aff5bd1b893da"
}
......@@ -17,7 +17,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common-primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common-primitives"
}
],
"python_path": "d3m.primitives.data_preprocessing.one_hot_encoder.MakerCommon",
......@@ -295,5 +295,5 @@
},
"structural_type": "common_primitives.one_hot_maker.OneHotMakerPrimitive",
"description": "Attempts to detect discrete values in data and convert these to a\none-hot embedding.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "8b19e9d7491b730cc2554f4f296787d686ce6443393f9c932827190dfd63e1de"
"digest": "e534452530096b269f63f9bdacdcc84f6817ab9264a89a8e85593c1ee1ce8f74"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common-primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common-primitives"
}
],
"algorithm_types": [
......@@ -257,5 +257,5 @@
},
"structural_type": "common_primitives.pandas_onehot_encoder.PandasOneHotEncoderPrimitive",
"description": "One-hot encoder using Pandas implementation.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "cd2bfb647f9467f7ff62ce05a7b097ce25d5f9fa532e1f816b77c85b06e13682"
"digest": "1baa4e6621504ff5d12e860950f86b2ea53aa8988baea69154b9eb4ec411b4cc"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -220,5 +220,5 @@
},
"structural_type": "common_primitives.regex_filter.RegexFilterPrimitive",
"description": "A primitive which filters rows from a DataFrame based on a regex applied to a given column.\nColumns are identified by index.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "9f15c69fccab23548598b286693a57e39e6ad88d31b1fcfeddcdccd1a2c27427"
"digest": "6db3aa49e6765aceb4623f0f9553ecf53d9453c02bfa428c81d8bd730278881e"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -237,5 +237,5 @@
},
"structural_type": "common_primitives.term_filter.TermFilterPrimitive",
"description": "A primitive which filters rows from a DataFrame based on a column value containing a match\nagainst a caller supplied term list. Supports search-style matching where the target need only\ncontain a term, as well as whole word matching where the target is tokenized using regex word boundaries.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "35289f87dfef70e1436ed679f938c95fbf20471426a19b832077a541c930a8aa"
"digest": "b2e55256986f6cf164206e067cc51b223ed7e220ee4cd2ce485ceb59b89bb6ae"
}
......@@ -19,7 +19,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -233,5 +233,5 @@
},
"structural_type": "common_primitives.text_reader.TextReaderPrimitive",
"description": "A primitive which reads columns referencing plain text files.\n\nEach column which has ``https://metadata.datadrivendiscovery.org/types/FileName`` semantic type\nand a valid media type (``text/plain``) has every filename read as a Python string. By default\nthe resulting column with read strings is appended to existing columns.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "ba1c5428f0d55fc2211244e043647283b264e8498aaa346fb7176c56ab3df7ba"
"digest": "d946eda4c9f640f028775d651ec71ce29fd71026713987184e4e71f4aff96dda"
}
......@@ -20,7 +20,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -235,5 +235,5 @@
},
"structural_type": "common_primitives.video_reader.VideoReaderPrimitive",
"description": "A primitive which reads columns referencing video files.\n\nEach column which has ``https://metadata.datadrivendiscovery.org/types/FileName`` semantic type\nand a valid media type (``video/mp4``, ``video/avi``) has every filename read into a video\nrepresented as a numpy array. By default the resulting column with read arrays is appended\nto existing columns.\n\nThe shape of numpy arrays is F x H x W x C. F is the number of frames, C is the number of\nchannels in a video (e.g., C = 1 for greyscale, C = 3 for RGB), H is the height, and W\nis the width. dtype is uint8.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "5a2961b4974a1af0dd503f90259474c6e5ed44a9a61a44163de9c8560d606b63"
"digest": "714e300e49931cd4cefb2a4e05d6859b59415c803667da77083bbf9e6db3fea8"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -227,5 +227,5 @@
},
"structural_type": "common_primitives.add_semantic_types.AddSemanticTypesPrimitive",
"description": "A primitive which adds semantic types for columns in a DataFrame.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "6fd5d1b397e8fee534b3db07ac739f660c9458767beddaf3b808a809d8a2f826"
"digest": "344f44f49f284dead2978baeefabaad4ab161d39686eb7f3eea678ebdb85c3c7"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -239,5 +239,5 @@
},
"structural_type": "common_primitives.cast_to_type.CastToTypePrimitive",
"description": "A primitive which casts all columns it can cast (by default, controlled by ``use_columns``,\n``exclude_columns``) of an input DataFrame to a given structural type (dtype).\nIt removes columns which are not cast.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "47897c2e8ac89371f3d162de714e094280da05c0a8faf6460bd473dabf8a6ff7"
"digest": "0addfa0f64002cc36611dd107635bcda3e43929597e2730698c72a48ded6656e"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -300,5 +300,5 @@
},
"structural_type": "common_primitives.column_parser.ColumnParserPrimitive",
"description": "A primitive which parses strings into their parsed values.\n\nIt goes over all columns (by default, controlled by ``use_columns``, ``exclude_columns``)\nand checks those with structural type ``str`` if they have a semantic type suggesting\nthat they are a boolean value, categorical, integer, float, or time (by default,\ncontrolled by ``parse_semantic_types``). Categorical values are converted with\nhash encoding.\n\nWhat is returned is controlled by ``return_result`` and ``add_index_columns``.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "7e16e2b1e559690e221de471826d7d1cd36698bc5140dc00f3c7a6c6b711c3b2"
"digest": "3756019a006c00b84ff31ffd39b19eb787b2e857932c8e41e2959b27629ac9e3"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -234,5 +234,5 @@
},
"structural_type": "common_primitives.construct_predictions.ConstructPredictionsPrimitive",
"description": "A primitive which takes as input a DataFrame and outputs a DataFrame in Lincoln Labs predictions\nformat: first column is a d3mIndex column (and other primary index columns, e.g., for object detection\nproblem), and then predicted targets, each in its column, followed by optional confidence column(s).\n\nIt supports both input columns annotated with semantic types (``https://metadata.datadrivendiscovery.org/types/PrimaryKey``,\n``https://metadata.datadrivendiscovery.org/types/PrimaryMultiKey``, ``https://metadata.datadrivendiscovery.org/types/PredictedTarget``,\n``https://metadata.datadrivendiscovery.org/types/Confidence``), or trying to reconstruct metadata.\nThis is why the primitive takes also additional input of a reference DataFrame which should\nhave metadata to help reconstruct missing metadata. If metadata is missing, the primitive\nassumes that all ``inputs`` columns are predicted targets, without confidence column(s).\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "077921b0d6cee9bbda9494bc60c8b48f8287db8d0bff674056a7c9e5cc92ebb9"
"digest": "c050f53d2dc380996e18f7d4bfd2902f9e3243e2a7d3b4dc2972b4bdc3a7e32b"
}
......@@ -18,7 +18,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -255,5 +255,5 @@
},
"structural_type": "common_primitives.cut_audio.CutAudioPrimitive",
"description": "A primitive which uses boundary columns to cut audio columns.\n\nIt uses ``http://schema.org/AudioObject`` and structural type ``container.ndarray` to\nfind columns with audio data.\n\nIt searches for boundary columns referencing them.\nBoundary columns are identified by ``https://metadata.datadrivendiscovery.org/types/Interval``,\n``https://metadata.datadrivendiscovery.org/types/IntervalStart`` and\n``https://metadata.datadrivendiscovery.org/types/IntervalEnd`` semantic types.\n\nIt requires that the audio dimension has ``sampling_rate`` metadata set.\n\nBoundaries are rounded down to samples. Cut is done exclusive: not including the last sample.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "a76273b1859fb13e8ca563af72cf511fcd18ed369ed4a5a3d782fd09bab62c38"
"digest": "57920b5ddde33e0c5564ed9ed48da1ae11dae6d32e44a9fa1d0d1df488db51cd"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -192,5 +192,5 @@
},
"structural_type": "common_primitives.dataframe_to_list.DataFrameToListPrimitive",
"description": "A primitive which converts a pandas dataframe into a list of rows.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "358be2c69beb94372f19831005066df28aa4b6df47de93aba34c591afb41ad4c"
"digest": "fe7a063eafc8a27feb40c1ce117bf02eb6c3a090f8917ed8e5bd6cce04437ae9"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -192,5 +192,5 @@
},
"structural_type": "common_primitives.dataframe_to_ndarray.DataFrameToNDArrayPrimitive",
"description": "A primitive which converts a pandas dataframe into a numpy array.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "32594c9a3c9bdc6315463fa8c169b18379b7fda7115354360de0d96298cf1960"
"digest": "508ada3d2ede1203cbd260773dfbdecd56754938b22fedf15bd396c6f8dd75a9"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -202,5 +202,5 @@
},
"structural_type": "common_primitives.dataset_to_dataframe.DatasetToDataFramePrimitive",
"description": "A primitive which extracts a DataFrame out of a Dataset.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "e557fc176af67913ed241dbe793cf986439157cfe9c4a12f1aafcba3c07b8b6f"
"digest": "3c3bdf07b4068bcb08f8ec614619f228234e1da3903f89b8d5ab0b1534180ca6"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -228,5 +228,5 @@
},
"structural_type": "common_primitives.datetime_field_compose.DatetimeFieldComposePrimitive",
"description": "A primitive which composes fields into a new single datetime field.\n\nThe primitve joins the columns (identified in the columns hyperparam) in order and then parses\nthe resulting string as a datetime. The value is stored in a new column.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "b60ed4233420a7198d1b079dbc5b21279a68c710a2c246b4b9f9a5168ab2476a"
"digest": "d173b830ceb5f4c0690dd8a6c5a071368d3fdd8df37d0c3e814b43529ceedb5c"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -204,5 +204,5 @@
},
"structural_type": "common_primitives.denormalize.DenormalizePrimitive",
"description": "A primitive which converts a Dataset with multiple tabular resources into a Dataset with only one tabular resource,\nbased on known relations between tabular resources. Any resource which can be joined is joined (thus the resource\nitself is removed), and other resources are by default discarded (controlled by ``discard_resources`` hyper-parameter).\n\nIf hyper-parameter ``recursive`` is set to ``True``, the primitive will join tables recursively. For example,\nif table 1 (main table) has a foreign key that points to table 2, and table 2 has a foreign key that points to table 3,\nthen after table 2 is jointed into table 1, table 1 will have a foreign key that points to table 3. So now the\nprimitive continues to join table 3 into the main table.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "afca078f05899b9f329e1b8cc0973848e39e83a7521d2cade81c1fbad5cf8139"
"digest": "ee3c396a46dd1ba3a330ec020c302402ae0bbf476e81e72ea4e7fd8ab46c8541"
}
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -210,5 +210,5 @@
},
"structural_type": "common_primitives.extract_columns.ExtractColumnsPrimitive",
"description": "A primitive which extracts a fixed list of columns.\n\nAttributes\n----------\nmetadata : PrimitiveMetadata\n Primitive's metadata. Available as a class attribute.\nlogger : Logger\n Primitive's logger. Available as a class attribute.\nhyperparams : Hyperparams\n Hyperparams passed to the constructor.\nrandom_seed : int\n Random seed passed to the constructor.\ndocker_containers : Dict[str, DockerContainer]\n A dict mapping Docker image keys from primitive's metadata to (named) tuples containing\n container's address under which the container is accessible by the primitive, and a\n dict mapping exposed ports to ports on that address.\nvolumes : Dict[str, str]\n A dict mapping volume keys from primitive's metadata to file and directory paths\n where downloaded and extracted files are available to the primitive.\ntemporary_directory : str\n An absolute path to a temporary directory a primitive can use to store any files\n for the duration of the current pipeline run phase. Directory is automatically\n cleaned up after the current pipeline run phase finishes.",
"digest": "a3c6012878b3cc2781d53b59d3a559cbb5bd2a6c6022ca754cff0ec84be3a534"
"digest": "1601b86899a0b5aef57d18bba93b14bfb62516a9dacb59c805bb514dc6e4a15b"
}
{
"id": "4503a4c6-42f7-45a1-a1d4-ed69699cf5e1",
"version": "0.2.0",
"version": "0.3.0",
"name": "Extracts columns by semantic type",
"python_path": "d3m.primitives.data_transformation.extract_columns_by_semantic_types.DataFrameCommon",
"source": {
......@@ -14,7 +14,7 @@
"installation": [
{
"type": "PIP",
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@6deddfd1e81f0d391f8d097aefe22b195d358b84#egg=common_primitives"
"package_uri": "git+https://gitlab.com/datadrivendiscovery/common-primitives.git@574444f11bd933d430cf8f398eda3b18279ff97b#egg=common_primitives"
}
],
"algorithm_types": [
......@@ -45,7 +45,7 @@
"semantic_types": [
"https://metadata.datadrivendiscovery.org/types/ControlParameter"
],
"description": "Semantic types to use to extract columns. If any of them matches.",
"description": "Semantic types to use to extract columns. If any of them matches, by default.",
"elements": {
"type": "d3m.metadata.hyperparams.Hyperparameter",
"default": "",
......@@ -55,6 +55,28 @@
"is_configuration": false,
"min_size": 1
},
"match_logic": {
"type": "d3m.metadata.hyperparams.Enumeration",
"default": "any",
"structural_type": "str",
"semantic_types": [
"https://metadata.datadrivendiscovery.org/types/ControlParameter"
],
"description": "Should a column have all of semantic types in \"semantic_types\" to be extracted, or any of them?",
"values": [
"all",
"any"
]
},
"negate": {
"type": "d3m.metadata.hyperparams.UniformBool",
"default": false,
"structural_type": "bool",
"semantic_types": [
"https://metadata.datadrivendiscovery.org/types/ControlParameter"
],
"description": "Should columns which do not match semantic types in \"semantic_types\" be extracted?"
},
"use_columns": {