{"@context":{"@language":"en","@vocab":"https://schema.org/","citeAs":"cr:citeAs","column":"cr:column","conformsTo":"dct:conformsTo","cr":"http://mlcommons.org/croissant/","data":{"@id":"cr:data","@type":"@json"},"dataBiases":"cr:dataBiases","dataCollection":"cr:dataCollection","dataType":{"@id":"cr:dataType","@type":"@vocab"},"dct":"http://purl.org/dc/terms/","extract":"cr:extract","field":"cr:field","fileProperty":"cr:fileProperty","fileObject":"cr:fileObject","fileSet":"cr:fileSet","format":"cr:format","includes":"cr:includes","isLiveDataset":"cr:isLiveDataset","jsonPath":"cr:jsonPath","key":"cr:key","md5":"cr:md5","parentField":"cr:parentField","path":"cr:path","personalSensitiveInformation":"cr:personalSensitiveInformation","recordSet":"cr:recordSet","references":"cr:references","regex":"cr:regex","repeated":"cr:repeated","replace":"cr:replace","sc":"https://schema.org/","separator":"cr:separator","source":"cr:source","subField":"cr:subField","transform":"cr:transform"},"@type":"sc:Dataset","distribution":[{"@type":"cr:FileObject","@id":"repo","name":"repo","description":"The Hugging Face git repository.","contentUrl":"https://huggingface.co/datasets/JetBrains-Research/lca-project-level-code-completion/tree/refs%2Fconvert%2Fparquet","encodingFormat":"git+https","sha256":"https://github.com/mlcommons/croissant/issues/80"},{"@type":"cr:FileSet","@id":"parquet-files-for-config-huge_context","name":"parquet-files-for-config-huge_context","description":"The underlying Parquet files as converted by Hugging Face (see: https://huggingface.co/docs/dataset-viewer/parquet).","containedIn":{"@id":"repo"},"encodingFormat":"application/x-parquet","includes":"huge_context/*/*.parquet"},{"@type":"cr:FileSet","@id":"parquet-files-for-config-large_context","name":"parquet-files-for-config-large_context","description":"The underlying Parquet files as converted by Hugging Face (see: 
https://huggingface.co/docs/dataset-viewer/parquet).","containedIn":{"@id":"repo"},"encodingFormat":"application/x-parquet","includes":"large_context/*/*.parquet"},{"@type":"cr:FileSet","@id":"parquet-files-for-config-medium_context","name":"parquet-files-for-config-medium_context","description":"The underlying Parquet files as converted by Hugging Face (see: https://huggingface.co/docs/dataset-viewer/parquet).","containedIn":{"@id":"repo"},"encodingFormat":"application/x-parquet","includes":"medium_context/*/*.parquet"},{"@type":"cr:FileSet","@id":"parquet-files-for-config-small_context","name":"parquet-files-for-config-small_context","description":"The underlying Parquet files as converted by Hugging Face (see: https://huggingface.co/docs/dataset-viewer/parquet).","containedIn":{"@id":"repo"},"encodingFormat":"application/x-parquet","includes":"small_context/*/*.parquet"}],"recordSet":[{"@type":"cr:RecordSet","dataType":"cr:Split","key":{"@id":"huge_context_splits/split_name"},"@id":"huge_context_splits","name":"huge_context_splits","description":"Splits for the huge_context config.","field":[{"@type":"cr:Field","@id":"huge_context_splits/split_name","name":"split_name","description":"The name of the split.","dataType":"sc:Text"}],"data":[{"huge_context_splits/split_name":"test"}]},{"@type":"cr:RecordSet","@id":"huge_context","name":"huge_context","description":"JetBrains-Research/lca-project-level-code-completion - 'huge_context' subset (first 5GB)","field":[{"@type":"cr:Field","@id":"huge_context/split","name":"huge_context/split","description":"Split to which the example belongs to.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"fileProperty":"fullpath"},"transform":{"regex":"huge_context/(?:partial-)?(test)/.+parquet$"}},"references":{"field":{"@id":"huge_context_splits/split_name"}}},{"@type":"cr:Field","@id":"huge_context/repo","name":"huge_context/repo","description":"Column 'repo' from the Hugging 
Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"repo"}}},{"@type":"cr:Field","@id":"huge_context/commit_hash","name":"huge_context/commit_hash","description":"Column 'commit_hash' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"commit_hash"}}},{"@type":"cr:Field","@id":"huge_context/completion_file","name":"huge_context/completion_file","description":"Column 'completion_file' from the Hugging Face parquet file.","subField":[{"@type":"cr:Field","@id":"huge_context/completion_file/filename","name":"huge_context/completion_file/filename","description":"Column 'completion_file' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"completion_file"},"transform":{"jsonPath":"filename"}}},{"@type":"cr:Field","@id":"huge_context/completion_file/content","name":"huge_context/completion_file/content","description":"Column 'completion_file' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"completion_file"},"transform":{"jsonPath":"content"}}}]},{"@type":"cr:Field","@id":"huge_context/completion_lines","name":"huge_context/completion_lines","description":"Column 'completion_lines' from the Hugging Face parquet file.","subField":[{"@type":"cr:Field","@id":"huge_context/completion_lines/commited","name":"huge_context/completion_lines/commited","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"huge_context/completion_lines/common","name":"huge_context/completion_lines/common","description":"Column 
'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"huge_context/completion_lines/infile","name":"huge_context/completion_lines/infile","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"huge_context/completion_lines/inproject","name":"huge_context/completion_lines/inproject","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"huge_context/completion_lines/non_informative","name":"huge_context/completion_lines/non_informative","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"huge_context/completion_lines/random","name":"huge_context/completion_lines/random","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"completion_lines"}},"repeated":true}]},{"@type":"cr:Field","@id":"huge_context/repo_snapshot","name":"huge_context/repo_snapshot","description":"Column 'repo_snapshot' from the Hugging Face parquet file.","subField":[{"@type":"cr:Field","@id":"huge_context/repo_snapshot/filename","name":"huge_context/repo_snapshot/filename","description":"Column 'repo_snapshot' from the Hugging Face parquet 
file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"repo_snapshot"},"transform":{"jsonPath":"filename"}}},{"@type":"cr:Field","@id":"huge_context/repo_snapshot/content","name":"huge_context/repo_snapshot/content","description":"Column 'repo_snapshot' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"repo_snapshot"},"transform":{"jsonPath":"content"}}}],"repeated":true},{"@type":"cr:Field","@id":"huge_context/completion_lines_raw","name":"huge_context/completion_lines_raw","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","subField":[{"@type":"cr:Field","@id":"huge_context/completion_lines_raw/commited","name":"huge_context/completion_lines_raw/commited","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"huge_context/completion_lines_raw/common","name":"huge_context/completion_lines_raw/common","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"huge_context/completion_lines_raw/infile","name":"huge_context/completion_lines_raw/infile","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"huge_context/completion_lines_raw/inproject","name":"huge_context/completion_lines_raw/inproject","description":"Column 'completion_lines_raw' from the Hugging Face 
parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"huge_context/completion_lines_raw/non_informative","name":"huge_context/completion_lines_raw/non_informative","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"huge_context/completion_lines_raw/other","name":"huge_context/completion_lines_raw/other","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-huge_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true}]}]},{"@type":"cr:RecordSet","dataType":"cr:Split","key":{"@id":"large_context_splits/split_name"},"@id":"large_context_splits","name":"large_context_splits","description":"Splits for the large_context config.","field":[{"@type":"cr:Field","@id":"large_context_splits/split_name","name":"split_name","description":"The name of the split.","dataType":"sc:Text"}],"data":[{"large_context_splits/split_name":"test"}]},{"@type":"cr:RecordSet","@id":"large_context","name":"large_context","description":"JetBrains-Research/lca-project-level-code-completion - 'large_context' subset (first 5GB)","field":[{"@type":"cr:Field","@id":"large_context/split","name":"large_context/split","description":"Split to which the example belongs to.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"fileProperty":"fullpath"},"transform":{"regex":"large_context/(?:partial-)?(test)/.+parquet$"}},"references":{"field":{"@id":"large_context_splits/split_name"}}},{"@type":"cr:Field","@id":"large_context/repo","name":"large_context/repo","description":"Column 'repo' from 
the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"repo"}}},{"@type":"cr:Field","@id":"large_context/commit_hash","name":"large_context/commit_hash","description":"Column 'commit_hash' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"commit_hash"}}},{"@type":"cr:Field","@id":"large_context/completion_file","name":"large_context/completion_file","description":"Column 'completion_file' from the Hugging Face parquet file.","subField":[{"@type":"cr:Field","@id":"large_context/completion_file/filename","name":"large_context/completion_file/filename","description":"Column 'completion_file' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"completion_file"},"transform":{"jsonPath":"filename"}}},{"@type":"cr:Field","@id":"large_context/completion_file/content","name":"large_context/completion_file/content","description":"Column 'completion_file' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"completion_file"},"transform":{"jsonPath":"content"}}}]},{"@type":"cr:Field","@id":"large_context/completion_lines","name":"large_context/completion_lines","description":"Column 'completion_lines' from the Hugging Face parquet file.","subField":[{"@type":"cr:Field","@id":"large_context/completion_lines/commited","name":"large_context/completion_lines/commited","description":"Column 'completion_lines' from the Hugging Face parquet 
file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"large_context/completion_lines/common","name":"large_context/completion_lines/common","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"large_context/completion_lines/infile","name":"large_context/completion_lines/infile","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"large_context/completion_lines/inproject","name":"large_context/completion_lines/inproject","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"large_context/completion_lines/non_informative","name":"large_context/completion_lines/non_informative","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"large_context/completion_lines/random","name":"large_context/completion_lines/random","description":"Column 'completion_lines' from the Hugging Face parquet 
file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"completion_lines"}},"repeated":true}]},{"@type":"cr:Field","@id":"large_context/repo_snapshot","name":"large_context/repo_snapshot","description":"Column 'repo_snapshot' from the Hugging Face parquet file.","subField":[{"@type":"cr:Field","@id":"large_context/repo_snapshot/filename","name":"large_context/repo_snapshot/filename","description":"Column 'repo_snapshot' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"repo_snapshot"},"transform":{"jsonPath":"filename"}}},{"@type":"cr:Field","@id":"large_context/repo_snapshot/content","name":"large_context/repo_snapshot/content","description":"Column 'repo_snapshot' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"repo_snapshot"},"transform":{"jsonPath":"content"}}}],"repeated":true},{"@type":"cr:Field","@id":"large_context/completion_lines_raw","name":"large_context/completion_lines_raw","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","subField":[{"@type":"cr:Field","@id":"large_context/completion_lines_raw/commited","name":"large_context/completion_lines_raw/commited","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"large_context/completion_lines_raw/common","name":"large_context/completion_lines_raw/common","description":"Column 'completion_lines_raw' from the Hugging Face parquet 
file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"large_context/completion_lines_raw/infile","name":"large_context/completion_lines_raw/infile","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"large_context/completion_lines_raw/inproject","name":"large_context/completion_lines_raw/inproject","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"large_context/completion_lines_raw/non_informative","name":"large_context/completion_lines_raw/non_informative","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"large_context/completion_lines_raw/other","name":"large_context/completion_lines_raw/other","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-large_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true}]}]},{"@type":"cr:RecordSet","dataType":"cr:Split","key":{"@id":"medium_context_splits/split_name"},"@id":"medium_context_splits","name":"medium_context_splits","description":"Splits for the medium_context config.","field":[{"@type":"cr:Field","@id":"medium_context_splits/split_name","name":"split_name","description":"The name of the 
split.","dataType":"sc:Text"}],"data":[{"medium_context_splits/split_name":"test"}]},{"@type":"cr:RecordSet","@id":"medium_context","name":"medium_context","description":"JetBrains-Research/lca-project-level-code-completion - 'medium_context' subset (first 5GB)","field":[{"@type":"cr:Field","@id":"medium_context/split","name":"medium_context/split","description":"Split to which the example belongs to.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"fileProperty":"fullpath"},"transform":{"regex":"medium_context/(?:partial-)?(test)/.+parquet$"}},"references":{"field":{"@id":"medium_context_splits/split_name"}}},{"@type":"cr:Field","@id":"medium_context/repo","name":"medium_context/repo","description":"Column 'repo' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"repo"}}},{"@type":"cr:Field","@id":"medium_context/commit_hash","name":"medium_context/commit_hash","description":"Column 'commit_hash' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"commit_hash"}}},{"@type":"cr:Field","@id":"medium_context/completion_file","name":"medium_context/completion_file","description":"Column 'completion_file' from the Hugging Face parquet file.","subField":[{"@type":"cr:Field","@id":"medium_context/completion_file/filename","name":"medium_context/completion_file/filename","description":"Column 'completion_file' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"completion_file"},"transform":{"jsonPath":"filename"}}},{"@type":"cr:Field","@id":"medium_context/completion_file/content","name":"medium_context/completion_file/content","description":"Column 'completion_file' from the Hugging Face parquet 
file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"completion_file"},"transform":{"jsonPath":"content"}}}]},{"@type":"cr:Field","@id":"medium_context/completion_lines","name":"medium_context/completion_lines","description":"Column 'completion_lines' from the Hugging Face parquet file.","subField":[{"@type":"cr:Field","@id":"medium_context/completion_lines/commited","name":"medium_context/completion_lines/commited","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"medium_context/completion_lines/common","name":"medium_context/completion_lines/common","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"medium_context/completion_lines/infile","name":"medium_context/completion_lines/infile","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"medium_context/completion_lines/inproject","name":"medium_context/completion_lines/inproject","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"medium_context/completion_lines/non_informative","name":"medium_context/completion_lines/non_informative","description":"Column 'completion_lines' from the Hugging Face parquet 
file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"medium_context/completion_lines/random","name":"medium_context/completion_lines/random","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"completion_lines"}},"repeated":true}]},{"@type":"cr:Field","@id":"medium_context/repo_snapshot","name":"medium_context/repo_snapshot","description":"Column 'repo_snapshot' from the Hugging Face parquet file.","subField":[{"@type":"cr:Field","@id":"medium_context/repo_snapshot/filename","name":"medium_context/repo_snapshot/filename","description":"Column 'repo_snapshot' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"repo_snapshot"},"transform":{"jsonPath":"filename"}}},{"@type":"cr:Field","@id":"medium_context/repo_snapshot/content","name":"medium_context/repo_snapshot/content","description":"Column 'repo_snapshot' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"repo_snapshot"},"transform":{"jsonPath":"content"}}}],"repeated":true},{"@type":"cr:Field","@id":"medium_context/completion_lines_raw","name":"medium_context/completion_lines_raw","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","subField":[{"@type":"cr:Field","@id":"medium_context/completion_lines_raw/commited","name":"medium_context/completion_lines_raw/commited","description":"Column 'completion_lines_raw' from the Hugging Face parquet 
file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"medium_context/completion_lines_raw/common","name":"medium_context/completion_lines_raw/common","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"medium_context/completion_lines_raw/infile","name":"medium_context/completion_lines_raw/infile","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"medium_context/completion_lines_raw/inproject","name":"medium_context/completion_lines_raw/inproject","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"medium_context/completion_lines_raw/non_informative","name":"medium_context/completion_lines_raw/non_informative","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"medium_context/completion_lines_raw/other","name":"medium_context/completion_lines_raw/other","description":"Column 'completion_lines_raw' from the Hugging Face parquet 
file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-medium_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true}]}]},{"@type":"cr:RecordSet","dataType":"cr:Split","key":{"@id":"small_context_splits/split_name"},"@id":"small_context_splits","name":"small_context_splits","description":"Splits for the small_context config.","field":[{"@type":"cr:Field","@id":"small_context_splits/split_name","name":"split_name","description":"The name of the split.","dataType":"sc:Text"}],"data":[{"small_context_splits/split_name":"test"}]},{"@type":"cr:RecordSet","@id":"small_context","name":"small_context","description":"JetBrains-Research/lca-project-level-code-completion - 'small_context' subset (first 5GB)","field":[{"@type":"cr:Field","@id":"small_context/split","name":"small_context/split","description":"Split to which the example belongs to.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"fileProperty":"fullpath"},"transform":{"regex":"small_context/(?:partial-)?(test)/.+parquet$"}},"references":{"field":{"@id":"small_context_splits/split_name"}}},{"@type":"cr:Field","@id":"small_context/repo","name":"small_context/repo","description":"Column 'repo' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"repo"}}},{"@type":"cr:Field","@id":"small_context/commit_hash","name":"small_context/commit_hash","description":"Column 'commit_hash' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"commit_hash"}}},{"@type":"cr:Field","@id":"small_context/completion_file","name":"small_context/completion_file","description":"Column 'completion_file' from the Hugging Face parquet 
file.","subField":[{"@type":"cr:Field","@id":"small_context/completion_file/filename","name":"small_context/completion_file/filename","description":"Column 'completion_file' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"completion_file"},"transform":{"jsonPath":"filename"}}},{"@type":"cr:Field","@id":"small_context/completion_file/content","name":"small_context/completion_file/content","description":"Column 'completion_file' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"completion_file"},"transform":{"jsonPath":"content"}}}]},{"@type":"cr:Field","@id":"small_context/completion_lines","name":"small_context/completion_lines","description":"Column 'completion_lines' from the Hugging Face parquet file.","subField":[{"@type":"cr:Field","@id":"small_context/completion_lines/commited","name":"small_context/completion_lines/commited","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"small_context/completion_lines/common","name":"small_context/completion_lines/common","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"small_context/completion_lines/infile","name":"small_context/completion_lines/infile","description":"Column 'completion_lines' from the Hugging Face parquet 
file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"small_context/completion_lines/inproject","name":"small_context/completion_lines/inproject","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"small_context/completion_lines/non_informative","name":"small_context/completion_lines/non_informative","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"completion_lines"}},"repeated":true},{"@type":"cr:Field","@id":"small_context/completion_lines/random","name":"small_context/completion_lines/random","description":"Column 'completion_lines' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"completion_lines"}},"repeated":true}]},{"@type":"cr:Field","@id":"small_context/repo_snapshot","name":"small_context/repo_snapshot","description":"Column 'repo_snapshot' from the Hugging Face parquet file.","subField":[{"@type":"cr:Field","@id":"small_context/repo_snapshot/filename","name":"small_context/repo_snapshot/filename","description":"Column 'repo_snapshot' from the Hugging Face parquet file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"repo_snapshot"},"transform":{"jsonPath":"filename"}}},{"@type":"cr:Field","@id":"small_context/repo_snapshot/content","name":"small_context/repo_snapshot/content","description":"Column 'repo_snapshot' from the Hugging Face parquet 
file.","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"repo_snapshot"},"transform":{"jsonPath":"content"}}}],"repeated":true},{"@type":"cr:Field","@id":"small_context/completion_lines_raw","name":"small_context/completion_lines_raw","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","subField":[{"@type":"cr:Field","@id":"small_context/completion_lines_raw/commited","name":"small_context/completion_lines_raw/commited","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"small_context/completion_lines_raw/common","name":"small_context/completion_lines_raw/common","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"small_context/completion_lines_raw/infile","name":"small_context/completion_lines_raw/infile","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"small_context/completion_lines_raw/inproject","name":"small_context/completion_lines_raw/inproject","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"small_context/completion_lines_raw/non_informative","name":"small_context/completion_lines_raw/non_informative","description":"Column 
'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true},{"@type":"cr:Field","@id":"small_context/completion_lines_raw/other","name":"small_context/completion_lines_raw/other","description":"Column 'completion_lines_raw' from the Hugging Face parquet file.","dataType":"sc:Integer","source":{"fileSet":{"@id":"parquet-files-for-config-small_context"},"extract":{"column":"completion_lines_raw"}},"repeated":true}]}]}],"conformsTo":"http://mlcommons.org/croissant/1.0","name":"lca-project-level-code-completion","identifier":"10.57967/hf/2512","description":"🏟️ Long Code Arena (Project-level code completion)\n\nThis is the benchmark for the project-level code completion task as part of the 🏟️ Long Code Arena benchmark.\nEach datapoint contains the file for completion, a list of lines to complete with their categories (see the categorization below), and a repository snapshot that can be used to build the context.\nAll the repositories are published under permissive licenses (MIT, Apache-2.0, BSD-3-Clause, and BSD-2-Clause). The datapoints can… See the full description on the dataset page: https://huggingface.co/datasets/JetBrains-Research/lca-project-level-code-completion.","alternateName":["JetBrains-Research/lca-project-level-code-completion"],"creator":{"@type":"Organization","name":"JetBrains Research","url":"https://huggingface.co/JetBrains-Research"},"keywords":["apache-2.0","< 1K","parquet","Text","Datasets","Dask","Croissant","Polars","arxiv:2406.11612","doi:10.57967/hf/2512","🇺🇸 Region: US"],"license":"https://choosealicense.com/licenses/apache-2.0/","url":"https://huggingface.co/datasets/JetBrains-Research/lca-project-level-code-completion"}