{"@context":{"@language":"en","@vocab":"https://schema.org/","citeAs":"cr:citeAs","column":"cr:column","conformsTo":"dct:conformsTo","cr":"http://mlcommons.org/croissant/","data":{"@id":"cr:data","@type":"@json"},"dataBiases":"cr:dataBiases","dataCollection":"cr:dataCollection","dataType":{"@id":"cr:dataType","@type":"@vocab"},"dct":"http://purl.org/dc/terms/","extract":"cr:extract","field":"cr:field","fileProperty":"cr:fileProperty","fileObject":"cr:fileObject","fileSet":"cr:fileSet","format":"cr:format","includes":"cr:includes","isLiveDataset":"cr:isLiveDataset","jsonPath":"cr:jsonPath","key":"cr:key","md5":"cr:md5","parentField":"cr:parentField","path":"cr:path","personalSensitiveInformation":"cr:personalSensitiveInformation","recordSet":"cr:recordSet","references":"cr:references","regex":"cr:regex","repeated":"cr:repeated","replace":"cr:replace","sc":"https://schema.org/","separator":"cr:separator","source":"cr:source","subField":"cr:subField","transform":"cr:transform"},"@type":"sc:Dataset","distribution":[{"@type":"cr:FileObject","@id":"repo","name":"repo","description":"The Hugging Face git repository.","contentUrl":"https://huggingface.co/datasets/JetBrains-Research/lca-bug-localization/tree/refs%2Fconvert%2Fparquet","encodingFormat":"git+https","sha256":"https://github.com/mlcommons/croissant/issues/80"},{"@type":"cr:FileSet","@id":"parquet-files-for-config-java","name":"parquet-files-for-config-java","description":"The underlying Parquet files as converted by Hugging Face (see: https://huggingface.co/docs/dataset-viewer/parquet).","containedIn":{"@id":"repo"},"encodingFormat":"application/x-parquet","includes":"java/*/*.parquet"},{"@type":"cr:FileSet","@id":"parquet-files-for-config-kt","name":"parquet-files-for-config-kt","description":"The underlying Parquet files as converted by Hugging Face (see: 
https://huggingface.co/docs/dataset-viewer/parquet).","containedIn":{"@id":"repo"},"encodingFormat":"application/x-parquet","includes":"kt/*/*.parquet"},{"@type":"cr:FileSet","@id":"parquet-files-for-config-py","name":"parquet-files-for-config-py","description":"The underlying Parquet files as converted by Hugging Face (see: https://huggingface.co/docs/dataset-viewer/parquet).","containedIn":{"@id":"repo"},"encodingFormat":"application/x-parquet","includes":"py/*/*.parquet"}],"recordSet":[{"@type":"cr:RecordSet","dataType":"cr:Split","key":{"@id":"java_splits/split_name"},"@id":"java_splits","name":"java_splits","description":"Splits for the java config.","field":[{"@type":"cr:Field","@id":"java_splits/split_name","name":"split_name","description":"The name of the split.","dataType":"sc:Text"}],"data":[{"java_splits/split_name":"dev"},{"java_splits/split_name":"test"},{"java_splits/split_name":"train"}]},{"@type":"cr:RecordSet","@id":"java","name":"java","description":"JetBrains-Research/lca-bug-localization - 'java' subset\n\nAdditional information:\n- 3 splits: dev, test, train\n- 1 skipped column: pull_create_at","field":[{"@type":"cr:Field","@id":"java/split","name":"java/split","description":"Split to which the example belongs to.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"fileProperty":"fullpath"},"transform":{"regex":"java/(?:partial-)?(dev|test|train)/.+parquet$"}},"references":{"field":{"@id":"java_splits/split_name"}}},{"@type":"cr:Field","@id":"java/id","name":"java/id","description":"Column 'id' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"id"}}},{"@type":"cr:Field","@id":"java/text_id","name":"java/text_id","description":"Column 'text_id' from the Hugging Face parquet 
file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"text_id"}}},{"@type":"cr:Field","@id":"java/repo_owner","name":"java/repo_owner","description":"Column 'repo_owner' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"repo_owner"}}},{"@type":"cr:Field","@id":"java/repo_name","name":"java/repo_name","description":"Column 'repo_name' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"repo_name"}}},{"@type":"cr:Field","@id":"java/issue_url","name":"java/issue_url","description":"Column 'issue_url' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"issue_url"}}},{"@type":"cr:Field","@id":"java/pull_url","name":"java/pull_url","description":"Column 'pull_url' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"pull_url"}}},{"@type":"cr:Field","@id":"java/comment_url","name":"java/comment_url","description":"Column 'comment_url' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"comment_url"}}},{"@type":"cr:Field","@id":"java/links_count","name":"java/links_count","description":"Column 'links_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"links_count"}}},{"@type":"cr:Field","@id":"java/link_keyword","name":"java/link_keyword","description":"Column 'link_keyword' from the Hugging Face parquet 
file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"link_keyword"}}},{"@type":"cr:Field","@id":"java/issue_title","name":"java/issue_title","description":"Column 'issue_title' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"issue_title"}}},{"@type":"cr:Field","@id":"java/issue_body","name":"java/issue_body","description":"Column 'issue_body' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"issue_body"}}},{"@type":"cr:Field","@id":"java/base_sha","name":"java/base_sha","description":"Column 'base_sha' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"base_sha"}}},{"@type":"cr:Field","@id":"java/head_sha","name":"java/head_sha","description":"Column 'head_sha' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"head_sha"}}},{"@type":"cr:Field","@id":"java/diff_url","name":"java/diff_url","description":"Column 'diff_url' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"diff_url"}}},{"@type":"cr:Field","@id":"java/diff","name":"java/diff","description":"Column 'diff' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"diff"}}},{"@type":"cr:Field","@id":"java/changed_files","name":"java/changed_files","description":"Column 'changed_files' from the Hugging Face parquet 
file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"changed_files"}}},{"@type":"cr:Field","@id":"java/changed_files_exts","name":"java/changed_files_exts","description":"Column 'changed_files_exts' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"changed_files_exts"}}},{"@type":"cr:Field","@id":"java/changed_files_count","name":"java/changed_files_count","description":"Column 'changed_files_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"changed_files_count"}}},{"@type":"cr:Field","@id":"java/java_changed_files_count","name":"java/java_changed_files_count","description":"Column 'java_changed_files_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"java_changed_files_count"}}},{"@type":"cr:Field","@id":"java/kt_changed_files_count","name":"java/kt_changed_files_count","description":"Column 'kt_changed_files_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"kt_changed_files_count"}}},{"@type":"cr:Field","@id":"java/py_changed_files_count","name":"java/py_changed_files_count","description":"Column 'py_changed_files_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"py_changed_files_count"}}},{"@type":"cr:Field","@id":"java/code_changed_files_count","name":"java/code_changed_files_count","description":"Column 'code_changed_files_count' from the Hugging Face parquet 
file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"code_changed_files_count"}}},{"@type":"cr:Field","@id":"java/repo_symbols_count","name":"java/repo_symbols_count","description":"Column 'repo_symbols_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"repo_symbols_count"}}},{"@type":"cr:Field","@id":"java/repo_tokens_count","name":"java/repo_tokens_count","description":"Column 'repo_tokens_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"repo_tokens_count"}}},{"@type":"cr:Field","@id":"java/repo_lines_count","name":"java/repo_lines_count","description":"Column 'repo_lines_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"repo_lines_count"}}},{"@type":"cr:Field","@id":"java/repo_files_without_tests_count","name":"java/repo_files_without_tests_count","description":"Column 'repo_files_without_tests_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"repo_files_without_tests_count"}}},{"@type":"cr:Field","@id":"java/changed_symbols_count","name":"java/changed_symbols_count","description":"Column 'changed_symbols_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"changed_symbols_count"}}},{"@type":"cr:Field","@id":"java/changed_tokens_count","name":"java/changed_tokens_count","description":"Column 'changed_tokens_count' from the Hugging Face parquet 
file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"changed_tokens_count"}}},{"@type":"cr:Field","@id":"java/changed_lines_count","name":"java/changed_lines_count","description":"Column 'changed_lines_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"changed_lines_count"}}},{"@type":"cr:Field","@id":"java/changed_files_without_tests_count","name":"java/changed_files_without_tests_count","description":"Column 'changed_files_without_tests_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"changed_files_without_tests_count"}}},{"@type":"cr:Field","@id":"java/issue_symbols_count","name":"java/issue_symbols_count","description":"Column 'issue_symbols_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"issue_symbols_count"}}},{"@type":"cr:Field","@id":"java/issue_words_count","name":"java/issue_words_count","description":"Column 'issue_words_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"issue_words_count"}}},{"@type":"cr:Field","@id":"java/issue_tokens_count","name":"java/issue_tokens_count","description":"Column 'issue_tokens_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"issue_tokens_count"}}},{"@type":"cr:Field","@id":"java/issue_lines_count","name":"java/issue_lines_count","description":"Column 'issue_lines_count' from the Hugging Face parquet 
file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"issue_lines_count"}}},{"@type":"cr:Field","@id":"java/issue_links_count","name":"java/issue_links_count","description":"Column 'issue_links_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"issue_links_count"}}},{"@type":"cr:Field","@id":"java/issue_code_blocks_count","name":"java/issue_code_blocks_count","description":"Column 'issue_code_blocks_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"issue_code_blocks_count"}}},{"@type":"cr:Field","@id":"java/repo_stars","name":"java/repo_stars","description":"Column 'repo_stars' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"repo_stars"}}},{"@type":"cr:Field","@id":"java/repo_language","name":"java/repo_language","description":"Column 'repo_language' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"repo_language"}}},{"@type":"cr:Field","@id":"java/repo_languages","name":"java/repo_languages","description":"Column 'repo_languages' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"repo_languages"}}},{"@type":"cr:Field","@id":"java/repo_license","name":"java/repo_license","description":"Column 'repo_license' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-java"},"extract":{"column":"repo_license"}}}]},{"@type":"cr:RecordSet","dataType":"cr:Split","key":{"@id":"kt_splits/split_name"},"@id":"kt_splits","name":"kt_splits","description":"Splits for the kt 
config.","field":[{"@type":"cr:Field","@id":"kt_splits/split_name","name":"split_name","description":"The name of the split.","dataType":"sc:Text"}],"data":[{"kt_splits/split_name":"dev"},{"kt_splits/split_name":"test"},{"kt_splits/split_name":"train"}]},{"@type":"cr:RecordSet","@id":"kt","name":"kt","description":"JetBrains-Research/lca-bug-localization - 'kt' subset\n\nAdditional information:\n- 3 splits: dev, test, train\n- 1 skipped column: pull_create_at","field":[{"@type":"cr:Field","@id":"kt/split","name":"kt/split","description":"Split to which the example belongs to.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"fileProperty":"fullpath"},"transform":{"regex":"kt/(?:partial-)?(dev|test|train)/.+parquet$"}},"references":{"field":{"@id":"kt_splits/split_name"}}},{"@type":"cr:Field","@id":"kt/id","name":"kt/id","description":"Column 'id' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"id"}}},{"@type":"cr:Field","@id":"kt/text_id","name":"kt/text_id","description":"Column 'text_id' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"text_id"}}},{"@type":"cr:Field","@id":"kt/repo_owner","name":"kt/repo_owner","description":"Column 'repo_owner' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"repo_owner"}}},{"@type":"cr:Field","@id":"kt/repo_name","name":"kt/repo_name","description":"Column 'repo_name' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"repo_name"}}},{"@type":"cr:Field","@id":"kt/issue_url","name":"kt/issue_url","description":"Column 'issue_url' from the Hugging Face parquet 
file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"issue_url"}}},{"@type":"cr:Field","@id":"kt/pull_url","name":"kt/pull_url","description":"Column 'pull_url' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"pull_url"}}},{"@type":"cr:Field","@id":"kt/comment_url","name":"kt/comment_url","description":"Column 'comment_url' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"comment_url"}}},{"@type":"cr:Field","@id":"kt/links_count","name":"kt/links_count","description":"Column 'links_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"links_count"}}},{"@type":"cr:Field","@id":"kt/link_keyword","name":"kt/link_keyword","description":"Column 'link_keyword' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"link_keyword"}}},{"@type":"cr:Field","@id":"kt/issue_title","name":"kt/issue_title","description":"Column 'issue_title' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"issue_title"}}},{"@type":"cr:Field","@id":"kt/issue_body","name":"kt/issue_body","description":"Column 'issue_body' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"issue_body"}}},{"@type":"cr:Field","@id":"kt/base_sha","name":"kt/base_sha","description":"Column 'base_sha' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"base_sha"}}},{"@type":"cr:Field","@id":"kt/head_sha","name":"kt/head_sha","description":"Column 'head_sha' from the 
Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"head_sha"}}},{"@type":"cr:Field","@id":"kt/diff_url","name":"kt/diff_url","description":"Column 'diff_url' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"diff_url"}}},{"@type":"cr:Field","@id":"kt/diff","name":"kt/diff","description":"Column 'diff' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"diff"}}},{"@type":"cr:Field","@id":"kt/changed_files","name":"kt/changed_files","description":"Column 'changed_files' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"changed_files"}}},{"@type":"cr:Field","@id":"kt/changed_files_exts","name":"kt/changed_files_exts","description":"Column 'changed_files_exts' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"changed_files_exts"}}},{"@type":"cr:Field","@id":"kt/changed_files_count","name":"kt/changed_files_count","description":"Column 'changed_files_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"changed_files_count"}}},{"@type":"cr:Field","@id":"kt/java_changed_files_count","name":"kt/java_changed_files_count","description":"Column 'java_changed_files_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"java_changed_files_count"}}},{"@type":"cr:Field","@id":"kt/kt_changed_files_count","name":"kt/kt_changed_files_count","description":"Column 'kt_changed_files_count' from the Hugging Face parquet 
file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"kt_changed_files_count"}}},{"@type":"cr:Field","@id":"kt/py_changed_files_count","name":"kt/py_changed_files_count","description":"Column 'py_changed_files_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"py_changed_files_count"}}},{"@type":"cr:Field","@id":"kt/code_changed_files_count","name":"kt/code_changed_files_count","description":"Column 'code_changed_files_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"code_changed_files_count"}}},{"@type":"cr:Field","@id":"kt/repo_symbols_count","name":"kt/repo_symbols_count","description":"Column 'repo_symbols_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"repo_symbols_count"}}},{"@type":"cr:Field","@id":"kt/repo_tokens_count","name":"kt/repo_tokens_count","description":"Column 'repo_tokens_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"repo_tokens_count"}}},{"@type":"cr:Field","@id":"kt/repo_lines_count","name":"kt/repo_lines_count","description":"Column 'repo_lines_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"repo_lines_count"}}},{"@type":"cr:Field","@id":"kt/repo_files_without_tests_count","name":"kt/repo_files_without_tests_count","description":"Column 'repo_files_without_tests_count' from the Hugging Face parquet 
file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"repo_files_without_tests_count"}}},{"@type":"cr:Field","@id":"kt/changed_symbols_count","name":"kt/changed_symbols_count","description":"Column 'changed_symbols_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"changed_symbols_count"}}},{"@type":"cr:Field","@id":"kt/changed_tokens_count","name":"kt/changed_tokens_count","description":"Column 'changed_tokens_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"changed_tokens_count"}}},{"@type":"cr:Field","@id":"kt/changed_lines_count","name":"kt/changed_lines_count","description":"Column 'changed_lines_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"changed_lines_count"}}},{"@type":"cr:Field","@id":"kt/changed_files_without_tests_count","name":"kt/changed_files_without_tests_count","description":"Column 'changed_files_without_tests_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"changed_files_without_tests_count"}}},{"@type":"cr:Field","@id":"kt/issue_symbols_count","name":"kt/issue_symbols_count","description":"Column 'issue_symbols_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"issue_symbols_count"}}},{"@type":"cr:Field","@id":"kt/issue_words_count","name":"kt/issue_words_count","description":"Column 'issue_words_count' from the Hugging Face parquet 
file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"issue_words_count"}}},{"@type":"cr:Field","@id":"kt/issue_tokens_count","name":"kt/issue_tokens_count","description":"Column 'issue_tokens_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"issue_tokens_count"}}},{"@type":"cr:Field","@id":"kt/issue_lines_count","name":"kt/issue_lines_count","description":"Column 'issue_lines_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"issue_lines_count"}}},{"@type":"cr:Field","@id":"kt/issue_links_count","name":"kt/issue_links_count","description":"Column 'issue_links_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"issue_links_count"}}},{"@type":"cr:Field","@id":"kt/issue_code_blocks_count","name":"kt/issue_code_blocks_count","description":"Column 'issue_code_blocks_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"issue_code_blocks_count"}}},{"@type":"cr:Field","@id":"kt/repo_stars","name":"kt/repo_stars","description":"Column 'repo_stars' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"repo_stars"}}},{"@type":"cr:Field","@id":"kt/repo_language","name":"kt/repo_language","description":"Column 'repo_language' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"repo_language"}}},{"@type":"cr:Field","@id":"kt/repo_languages","name":"kt/repo_languages","description":"Column 'repo_languages' from the Hugging Face parquet 
file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"repo_languages"}}},{"@type":"cr:Field","@id":"kt/repo_license","name":"kt/repo_license","description":"Column 'repo_license' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-kt"},"extract":{"column":"repo_license"}}}]},{"@type":"cr:RecordSet","dataType":"cr:Split","key":{"@id":"py_splits/split_name"},"@id":"py_splits","name":"py_splits","description":"Splits for the py config.","field":[{"@type":"cr:Field","@id":"py_splits/split_name","name":"split_name","description":"The name of the split.","dataType":"sc:Text"}],"data":[{"py_splits/split_name":"dev"},{"py_splits/split_name":"test"},{"py_splits/split_name":"train"}]},{"@type":"cr:RecordSet","@id":"py","name":"py","description":"JetBrains-Research/lca-bug-localization - 'py' subset\n\nAdditional information:\n- 3 splits: dev, test, train\n- 1 skipped column: pull_create_at","field":[{"@type":"cr:Field","@id":"py/split","name":"py/split","description":"Split to which the example belongs to.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"fileProperty":"fullpath"},"transform":{"regex":"py/(?:partial-)?(dev|test|train)/.+parquet$"}},"references":{"field":{"@id":"py_splits/split_name"}}},{"@type":"cr:Field","@id":"py/id","name":"py/id","description":"Column 'id' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"id"}}},{"@type":"cr:Field","@id":"py/text_id","name":"py/text_id","description":"Column 'text_id' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"text_id"}}},{"@type":"cr:Field","@id":"py/repo_owner","name":"py/repo_owner","description":"Column 'repo_owner' from the Hugging Face parquet 
file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"repo_owner"}}},{"@type":"cr:Field","@id":"py/repo_name","name":"py/repo_name","description":"Column 'repo_name' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"repo_name"}}},{"@type":"cr:Field","@id":"py/issue_url","name":"py/issue_url","description":"Column 'issue_url' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"issue_url"}}},{"@type":"cr:Field","@id":"py/pull_url","name":"py/pull_url","description":"Column 'pull_url' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"pull_url"}}},{"@type":"cr:Field","@id":"py/comment_url","name":"py/comment_url","description":"Column 'comment_url' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"comment_url"}}},{"@type":"cr:Field","@id":"py/links_count","name":"py/links_count","description":"Column 'links_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"links_count"}}},{"@type":"cr:Field","@id":"py/link_keyword","name":"py/link_keyword","description":"Column 'link_keyword' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"link_keyword"}}},{"@type":"cr:Field","@id":"py/issue_title","name":"py/issue_title","description":"Column 'issue_title' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"issue_title"}}},{"@type":"cr:Field","@id":"py/issue_body","name":"py/issue_body","description":"Column 'issue_body' from 
the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"issue_body"}}},{"@type":"cr:Field","@id":"py/base_sha","name":"py/base_sha","description":"Column 'base_sha' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"base_sha"}}},{"@type":"cr:Field","@id":"py/head_sha","name":"py/head_sha","description":"Column 'head_sha' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"head_sha"}}},{"@type":"cr:Field","@id":"py/diff_url","name":"py/diff_url","description":"Column 'diff_url' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"diff_url"}}},{"@type":"cr:Field","@id":"py/diff","name":"py/diff","description":"Column 'diff' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"diff"}}},{"@type":"cr:Field","@id":"py/changed_files","name":"py/changed_files","description":"Column 'changed_files' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"changed_files"}}},{"@type":"cr:Field","@id":"py/changed_files_exts","name":"py/changed_files_exts","description":"Column 'changed_files_exts' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"changed_files_exts"}}},{"@type":"cr:Field","@id":"py/changed_files_count","name":"py/changed_files_count","description":"Column 'changed_files_count' from the Hugging Face parquet 
file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"changed_files_count"}}},{"@type":"cr:Field","@id":"py/java_changed_files_count","name":"py/java_changed_files_count","description":"Column 'java_changed_files_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"java_changed_files_count"}}},{"@type":"cr:Field","@id":"py/kt_changed_files_count","name":"py/kt_changed_files_count","description":"Column 'kt_changed_files_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"kt_changed_files_count"}}},{"@type":"cr:Field","@id":"py/py_changed_files_count","name":"py/py_changed_files_count","description":"Column 'py_changed_files_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"py_changed_files_count"}}},{"@type":"cr:Field","@id":"py/code_changed_files_count","name":"py/code_changed_files_count","description":"Column 'code_changed_files_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"code_changed_files_count"}}},{"@type":"cr:Field","@id":"py/repo_symbols_count","name":"py/repo_symbols_count","description":"Column 'repo_symbols_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"repo_symbols_count"}}},{"@type":"cr:Field","@id":"py/repo_tokens_count","name":"py/repo_tokens_count","description":"Column 'repo_tokens_count' from the Hugging Face parquet 
file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"repo_tokens_count"}}},{"@type":"cr:Field","@id":"py/repo_lines_count","name":"py/repo_lines_count","description":"Column 'repo_lines_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"repo_lines_count"}}},{"@type":"cr:Field","@id":"py/repo_files_without_tests_count","name":"py/repo_files_without_tests_count","description":"Column 'repo_files_without_tests_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"repo_files_without_tests_count"}}},{"@type":"cr:Field","@id":"py/changed_symbols_count","name":"py/changed_symbols_count","description":"Column 'changed_symbols_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"changed_symbols_count"}}},{"@type":"cr:Field","@id":"py/changed_tokens_count","name":"py/changed_tokens_count","description":"Column 'changed_tokens_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"changed_tokens_count"}}},{"@type":"cr:Field","@id":"py/changed_lines_count","name":"py/changed_lines_count","description":"Column 'changed_lines_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"changed_lines_count"}}},{"@type":"cr:Field","@id":"py/changed_files_without_tests_count","name":"py/changed_files_without_tests_count","description":"Column 'changed_files_without_tests_count' from the Hugging Face parquet 
file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"changed_files_without_tests_count"}}},{"@type":"cr:Field","@id":"py/issue_symbols_count","name":"py/issue_symbols_count","description":"Column 'issue_symbols_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"issue_symbols_count"}}},{"@type":"cr:Field","@id":"py/issue_words_count","name":"py/issue_words_count","description":"Column 'issue_words_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"issue_words_count"}}},{"@type":"cr:Field","@id":"py/issue_tokens_count","name":"py/issue_tokens_count","description":"Column 'issue_tokens_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"issue_tokens_count"}}},{"@type":"cr:Field","@id":"py/issue_lines_count","name":"py/issue_lines_count","description":"Column 'issue_lines_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"issue_lines_count"}}},{"@type":"cr:Field","@id":"py/issue_links_count","name":"py/issue_links_count","description":"Column 'issue_links_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"issue_links_count"}}},{"@type":"cr:Field","@id":"py/issue_code_blocks_count","name":"py/issue_code_blocks_count","description":"Column 'issue_code_blocks_count' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"issue_code_blocks_count"}}},{"@type":"cr:Field","@id":"py/repo_stars","name":"py/repo_stars","description":"Column 'repo_stars' from the Hugging 
Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"repo_stars"}}},{"@type":"cr:Field","@id":"py/repo_language","name":"py/repo_language","description":"Column 'repo_language' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"repo_language"}}},{"@type":"cr:Field","@id":"py/repo_languages","name":"py/repo_languages","description":"Column 'repo_languages' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"repo_languages"}}},{"@type":"cr:Field","@id":"py/repo_license","name":"py/repo_license","description":"Column 'repo_license' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-py"},"extract":{"column":"repo_license"}}}]}],"conformsTo":"http://mlcommons.org/croissant/1.0","name":"lca-bug-localization","identifier":"10.57967/hf/2514","description":"🏟️ Long Code Arena (Bug localization)\n\nThis is the benchmark for the Bug localization task as part of the 🏟️ Long Code Arena benchmark.\nThe bug localization problem can be formulated as follows: given an issue with a bug description and a repository snapshot in a state where the bug is reproducible, identify the files within the repository that need to be modified to address the reported bug.\nThe dataset provides all the required components for evaluation of bug localization… See the full description on the dataset page: https://huggingface.co/datasets/JetBrains-Research/lca-bug-localization.","alternateName":["JetBrains-Research/lca-bug-localization","LCA (Bug Localization)"],"creator":{"@type":"Organization","name":"JetBrains Research","url":"https://huggingface.co/JetBrains-Research"},"keywords":["text-generation","English","apache-2.0","10K - 100K","parquet","Image","Tabular","Text","Datasets","pandas","Croissant","Polars","arxiv:2406.11612","doi:10.57967/hf/2514","🇺🇸 Region: US","code"],"license":"https://choosealicense.com/licenses/apache-2.0/","url":"https://huggingface.co/datasets/JetBrains-Research/lca-bug-localization"}