{"@context":{"@language":"en","@vocab":"https://schema.org/","arrayShape":"cr:arrayShape","citeAs":"cr:citeAs","column":"cr:column","conformsTo":"dct:conformsTo","cr":"http://mlcommons.org/croissant/","data":{"@id":"cr:data","@type":"@json"},"dataBiases":"cr:dataBiases","dataCollection":"cr:dataCollection","dataType":{"@id":"cr:dataType","@type":"@vocab"},"dct":"http://purl.org/dc/terms/","extract":"cr:extract","field":"cr:field","fileProperty":"cr:fileProperty","fileObject":"cr:fileObject","fileSet":"cr:fileSet","format":"cr:format","includes":"cr:includes","isArray":"cr:isArray","isLiveDataset":"cr:isLiveDataset","jsonPath":"cr:jsonPath","key":"cr:key","md5":"cr:md5","parentField":"cr:parentField","path":"cr:path","personalSensitiveInformation":"cr:personalSensitiveInformation","recordSet":"cr:recordSet","references":"cr:references","regex":"cr:regex","repeated":"cr:repeated","replace":"cr:replace","sc":"https://schema.org/","separator":"cr:separator","source":"cr:source","subField":"cr:subField","transform":"cr:transform"},"@type":"sc:Dataset","distribution":[{"@type":"cr:FileObject","@id":"repo","name":"repo","description":"The Hugging Face git repository.","contentUrl":"https://huggingface.co/datasets/TalBarami/msd_bms_air_quality/tree/refs%2Fconvert%2Fparquet","encodingFormat":"git+https","sha256":"https://github.com/mlcommons/croissant/issues/80"},{"@type":"cr:FileSet","@id":"parquet-files-for-config-default","containedIn":{"@id":"repo"},"encodingFormat":"application/x-parquet","includes":"default/*/*.parquet"}],"recordSet":[{"@type":"cr:RecordSet","dataType":"cr:Split","key":{"@id":"default_splits/split_name"},"@id":"default_splits","name":"default_splits","description":"Splits for the default config.","field":[{"@type":"cr:Field","@id":"default_splits/split_name","dataType":"sc:Text"}],"data":[{"default_splits/split_name":"train"},{"default_splits/split_name":"val"},{"default_splits/split_name":"test"}]},{"@type":"cr:RecordSet","@id":"default","description":"TalBarami/msd_bms_air_quality - 'default' subset\n\nAdditional information:\n- 3 splits: train, val, test\n- 1 skipped column: x","field":[{"@type":"cr:Field","@id":"default/split","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-default"},"extract":{"fileProperty":"fullpath"},"transform":{"regex":"default/(?:partial-)?(train|val|test)/.+parquet$"}},"references":{"field":{"@id":"default_splits/split_name"}}},{"@type":"cr:Field","@id":"default/id","dataType":"cr:Int32","source":{"fileSet":{"@id":"parquet-files-for-config-default"},"extract":{"column":"id"}}},{"@type":"cr:Field","@id":"default/station","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-default"},"extract":{"column":"station"}}},{"@type":"cr:Field","@id":"default/year","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-default"},"extract":{"column":"year"}}},{"@type":"cr:Field","@id":"default/month","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-default"},"extract":{"column":"month"}}},{"@type":"cr:Field","@id":"default/day","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-default"},"extract":{"column":"day"}}},{"@type":"cr:Field","@id":"default/season","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-default"},"extract":{"column":"season"}}}]}],"conformsTo":"http://mlcommons.org/croissant/1.1","name":"msd_bms_air_quality","description":"\n\t\n\t\t\n\t\tMSD Beijing Multi-Site Air Quality Dataset Attribution\n\t\n\nThe Multi-factor Sequential Disentanglement benchmark includes the Beijing Multi-Site Air Quality (BMS-AQ) dataset, a time series dataset that captures daily air quality and weather measurements across multiple monitoring stations in Beijing.\nFor the benchmark, we preprocess this data into daily sequences of 24 hourly records, grouped by station and date.\nEach sequence is labeled with static attributes such as station, year… See the full description on the dataset page: https://huggingface.co/datasets/TalBarami/msd_bms_air_quality.","alternateName":["TalBarami/msd_bms_air_quality"],"creator":{"@type":"Person","name":"Tal Barami","url":"https://huggingface.co/TalBarami"},"keywords":["apache-2.0","10K - 100K","parquet","Datasets","pandas","Croissant","Polars","🇺🇸 Region: US"],"license":"https://choosealicense.com/licenses/apache-2.0/","url":"https://huggingface.co/datasets/TalBarami/msd_bms_air_quality"}