{"total_documents": 8355, "words_document_mean": 5.91, "vocabulary_length": 1696, "last-training-doc": 5847, "last-validation-doc": 7101, "preprocessing-info": "Steps:\n  remove_punctuation\n  lemmatization\n  remove_stopwords\n  filter_words\n  remove_docs\nParameters:\n  removed words with less than 0.0005 or more than 1 documents with an occurrence of the word in corpus\n  removed documents with less than 3 words", "info": {"name": "CiteSeer-M10", "link": "https://github.com/shiruipan/TriDNR", "source": "https://github.com/shiruipan/TriDNR", "paper": "https://www.ijcai.org/Proceedings/16/Papers/271.pdf", "citation": "@inproceedings{DBLP:conf/ijcai/PanWZZW16,\n  author    = {Shirui Pan and\n               Jia Wu and\n               Xingquan Zhu and\n               Chengqi Zhang and\n               Yang Wang},\n  editor    = {Subbarao Kambhampati},\n  title     = {Tri-Party Deep Network Representation},\n  booktitle = {Proceedings of the Twenty-Fifth International Joint Conference on\n               Artificial Intelligence, {IJCAI} 2016, New York, NY, USA, 9-15 July\n               2016},\n  pages     = {1895--1901},\n  publisher = {{IJCAI/AAAI} Press},\n  year      = {2016},\n  url       = {http://www.ijcai.org/Abstract/16/271},\n  timestamp = {Tue, 20 Aug 2019 16:19:21 +0200},\n  biburl    = {https://dblp.org/rec/conf/ijcai/PanWZZW16.bib},\n  bibsource = {dblp computer science bibliography, https://dblp.org}\n}"}, "labels": ["0", "1", "2", "3", "4", "5", "6", "7", "8", "9"], "total_labels": 10}