{
  "algorithm": {
    "command": null,
    "id": 4,
    "name": "Gensim Continuous Bag-of-Words",
    "tool": "Gensim",
    "url": "https://github.com/RaRe-Technologies/gensim",
    "version": "3.6"
  },
  "contents": [
    {
      "filename": "model.txt",
      "format": "text"
    },
    {
      "filename": "model.bin",
      "format": "data"
    },
    {
      "filename": "meta.json",
      "format": "json"
    }
  ],
  "corpus": [
    {
      "NER": false,
      "case preserved": false,
      "description": "Oil and Gas corpus",
      "id": 75,
      "language": "eng",
      "lemmatized": true,
      "license": "proprietary",
      "public": false,
      "stop words removal": "NLTK",
      "tagger": "Stanford Core NLP v. 3.6.0",
      "tagset": null,
      "tokens": 108000000,
      "tool": null,
      "url": null
    }
  ],
  "creators": [
    {
      "email": "farhadno@ifi.uio.no",
      "name": "Farhad Nooralahzadeh"
    }
  ],
  "dimensions": 400,
  "handle": "http://vectors.nlpl.eu/repository/20/75.zip",
  "id": 75,
  "iterations": 5,
  "vocabulary size": 285055,
  "window": 5
}