{
  "algorithm": {
    "command": null,
    "id": 4,
    "name": "Gensim Continuous Bag-of-Words",
    "tool": "Gensim",
    "url": "https://github.com/RaRe-Technologies/gensim",
    "version": "3.6"
  },
  "contents": [
    {
      "filename": "model.txt",
      "format": "text"
    },
    {
      "filename": "model.bin",
      "format": "data"
    },
    {
      "filename": "meta.json",
      "format": "json"
    }
  ],
  "corpus": [
    {
      "NER": false,
      "case preserved": false,
      "description": "Oil and Gas corpus",
      "id": 75,
      "language": "eng",
      "lemmatized": true,
      "license": "proprietary",
      "public": false,
      "stop words removal": "NLTK",
      "tagger": "Stanford Core NLP v. 3.6.0",
      "tagset": null,
      "tokens": 108000000,
      "tool": null,
      "url": null
    }
  ],
  "creators": [
    {
      "email": "farhadno@ifi.uio.no",
      "name": "Farhad Nooralahzadeh"
    }
  ],
  "dimensions": 400,
  "handle": "http://vectors.nlpl.eu/repository/20/75.zip",
  "id": 75,
  "iterations": 5,
  "vocabulary size": 285055,
  "window": 5
}