|
|
@@ -6,7 +6,7 @@
|
|
|
|
|
|
ga('create', 'UA-44373548-30', 'auto');
|
|
|
ga('send', 'pageview');
|
|
|
- </script><link rel="stylesheet" href="/css/main.css"/></head><body class="sideNavVisible"><div class="fixedHeaderContainer"><div class="headerWrapper wrapper"><header><a href="/"><img class="logo" src="/img/fasttext-icon-white-web.png" alt="fastText"/></a><div class="navigationWrapper navigationSlider"><nav class="slidingNav"><ul class="nav-site nav-site-internal"><li class=""><a href="/docs/en/support.html" target="_self">Docs</a></li><li class="siteNavGroupActive"><a href="/docs/en/english-vectors.html" target="_self">Download</a></li><li class=""><a href="/blog" target="_self">Blog</a></li><li class=""><a href="https://github.com/facebookresearch/fastText/" target="_blank">GitHub</a></li></ul></nav></div></header></div></div><div class="navPusher"><div class="docMainWrapper wrapper"><div class="container docsNavContainer" id="docsNav"><nav class="toc"><div class="toggleNav"><section class="navWrapper wrapper"><div class="navBreadcrumb wrapper"><div class="navToggle" id="navToggler"><i></i></div><h2><i>›</i><span>Download</span></h2></div><div class="navGroups"><div class="navGroup"><h3 class="navGroupCategoryTitle">Download</h3><ul><li class="navListItem"><a class="navItem" href="/docs/en/english-vectors.html">English word vectors</a></li><li class="navListItem navListItemActive"><a class="navItem" href="/docs/en/crawl-vectors.html">Word vectors for 157 languages</a></li><li class="navListItem"><a class="navItem" href="/docs/en/pretrained-vectors.html">Wiki word vectors</a></li><li class="navListItem"><a class="navItem" href="/docs/en/aligned-vectors.html">Aligned word vectors</a></li><li class="navListItem"><a class="navItem" href="/docs/en/supervised-models.html">Supervised models</a></li><li class="navListItem"><a class="navItem" href="/docs/en/language-identification.html">Language identification</a></li><li class="navListItem"><a class="navItem" href="/docs/en/dataset.html">Datasets</a></li></ul></div></div></section></div><script>
|
|
|
+ </script><link rel="stylesheet" href="/css/main.css"/></head><body class="sideNavVisible"><div class="fixedHeaderContainer"><div class="headerWrapper wrapper"><header><a href="/"><img class="logo" src="/img/fasttext-icon-white-web.png" alt="fastText"/></a><div class="navigationWrapper navigationSlider"><nav class="slidingNav"><ul class="nav-site nav-site-internal"><li class=""><a href="/docs/en/support.html" target="_self">Docs</a></li><li class="siteNavGroupActive"><a href="/docs/en/english-vectors.html" target="_self">Download</a></li><li class=""><a href="/blog/" target="_self">Blog</a></li><li class=""><a href="https://github.com/facebookresearch/fastText/" target="_blank">GitHub</a></li></ul></nav></div></header></div></div><div class="navPusher"><div class="docMainWrapper wrapper"><div class="container docsNavContainer" id="docsNav"><nav class="toc"><div class="toggleNav"><section class="navWrapper wrapper"><div class="navBreadcrumb wrapper"><div class="navToggle" id="navToggler"><i></i></div><h2><i>›</i><span>Download</span></h2></div><div class="navGroups"><div class="navGroup"><h3 class="navGroupCategoryTitle">Download</h3><ul><li class="navListItem"><a class="navItem" href="/docs/en/english-vectors.html">English word vectors</a></li><li class="navListItem navListItemActive"><a class="navItem" href="/docs/en/crawl-vectors.html">Word vectors for 157 languages</a></li><li class="navListItem"><a class="navItem" href="/docs/en/pretrained-vectors.html">Wiki word vectors</a></li><li class="navListItem"><a class="navItem" href="/docs/en/aligned-vectors.html">Aligned word vectors</a></li><li class="navListItem"><a class="navItem" href="/docs/en/supervised-models.html">Supervised models</a></li><li class="navListItem"><a class="navItem" href="/docs/en/language-identification.html">Language identification</a></li><li class="navListItem"><a class="navItem" href="/docs/en/dataset.html">Datasets</a></li></ul></div></div></section></div><script>
|
|
|
document.addEventListener('DOMContentLoaded', function() {
|
|
|
createToggler('#navToggler', '#docsNav', 'docsSliderActive');
|
|
|
createToggler('#tocToggler', 'body', 'tocActive');
|
|
|
@@ -33,7 +33,7 @@
|
|
|
};
|
|
|
}
|
|
|
});
|
|
|
- </script></nav></div><div class="container mainContainer"><div class="wrapper"><div class="post"><header class="postHeader"><h1 class="postHeaderTitle">Word vectors for 157 languages</h1></header><article><div><span><p>We distribute pre-trained word vectors for 157 languages, trained on <a href="http://commoncrawl.org/"><em>Common Crawl</em></a> and <a href="https://www.wikipedia.org"><em>Wikipedia</em></a> using fastText.
|
|
|
+ </script></nav></div><div class="container mainContainer docMainContainer"><div class="wrapper"><div class="post"><header class="postHeader"><h1 class="postHeaderTitle">Word vectors for 157 languages</h1></header><article><div><span><p>We distribute pre-trained word vectors for 157 languages, trained on <a href="http://commoncrawl.org/"><em>Common Crawl</em></a> and <a href="https://www.wikipedia.org"><em>Wikipedia</em></a> using fastText.
|
|
|
These models were trained using CBOW with position-weights, in dimension 300, with character n-grams of length 5, a window of size 5 and 10 negatives.
|
|
|
We also distribute three new word analogy datasets, for French, Hindi and Polish.</p>
|
|
|
<h3><a class="anchor" aria-hidden="true" id="format"></a><a href="#format" aria-hidden="true" class="hash-link"><svg class="hash-link-icon" aria-hidden="true" height="16" version="1.1" viewBox="0 0 16 16" width="16"><path fill-rule="evenodd" d="M4 9h1v1H4c-1.5 0-3-1.69-3-3.5S2.55 3 4 3h4c1.45 0 3 1.69 3 3.5 0 1.41-.91 2.72-2 3.25V8.59c.58-.45 1-1.27 1-2.09C10 5.22 8.98 4 8 4H4c-.98 0-2 1.22-2 2.5S3 9 4 9zm9-3h-1v1h1c1 0 2 1.22 2 2.5S13.98 12 13 12H9c-.98 0-2-1.22-2-2.5 0-.83.42-1.64 1-2.09V6.25c-1.09.53-2 1.84-2 3.25C6 11.31 7.55 13 9 13h4c1.45 0 3-1.69 3-3.5S14.5 6 13 6z"></path></svg></a>Format</h3>
|
|
|
@@ -137,4 +137,4 @@ For the remaining languages, we used the ICU tokenizer.</p>
|
|
|
<tr><td>Zazaki: <a href="https://s3-us-west-1.amazonaws.com/fasttext-vectors/word-vectors-v2/cc.diq.300.bin.gz">bin</a>, <a href="https://s3-us-west-1.amazonaws.com/fasttext-vectors/word-vectors-v2/cc.diq.300.vec.gz">text</a></td><td>Zeelandic: <a href="https://s3-us-west-1.amazonaws.com/fasttext-vectors/word-vectors-v2/cc.zea.300.bin.gz">bin</a>, <a href="https://s3-us-west-1.amazonaws.com/fasttext-vectors/word-vectors-v2/cc.zea.300.vec.gz">text</a></td></tr>
|
|
|
</tbody>
|
|
|
</table>
|
|
|
-</span></div></article></div><div class="docs-prevnext"><a class="docs-prev button" href="/docs/en/english-vectors.html">← English word vectors</a><a class="docs-next button" href="/docs/en/pretrained-vectors.html">Wiki word vectors →</a></div></div></div></div><footer class="nav-footer" id="footer"><section class="sitemap"><a href="/" class="nav-home"><img src="/img/fasttext-icon-white-web.png" alt="fastText"/></a><div><h5>Support</h5><a href="/docs/en/support.html">Getting Started</a><a href="/docs/en/supervised-tutorial.html">Tutorials</a><a href="/docs/en/faqs.html">FAQs</a><a href="/docs/en/api.html">API</a></div><div><h5>Community</h5><a href="https://www.facebook.com/groups/1174547215919768/" target="_blank">Facebook Group</a><a href="http://stackoverflow.com/questions/tagged/fasttext" target="_blank">Stack Overflow</a><a href="https://groups.google.com/forum/#!forum/fasttext-library" target="_blank">Google Group</a></div><div><h5>More</h5><a href="/blog">Blog</a><a href="https://github.com/facebookresearch/fastText" target="_blank">GitHub</a><a class="github-button" href="https://github.com/facebookresearch/fastText/" data-icon="octicon-star" data-count-href="/fastText/stargazers" data-count-api="/repos/fastText#stargazers_count" data-count-aria-label="# stargazers on GitHub" aria-label="Star this project on GitHub">Star</a></div></section><a href="https://code.facebook.com/projects/" target="_blank" class="fbOpenSource"><img src="/img/oss_logo.png" alt="Facebook Open Source" width="170" height="45"/></a><section class="copyright">Copyright © 2018 Facebook Inc.</section></footer></div></body></html>
|
|
|
+</span></div></article></div><div class="docs-prevnext"><a class="docs-prev button" href="/docs/en/english-vectors.html"><span class="arrow-prev">← </span><span>Previous</span></a><a class="docs-next button" href="/docs/en/pretrained-vectors.html"><span>Next</span><span class="arrow-next"> →</span></a></div></div></div></div><footer class="nav-footer" id="footer"><section class="sitemap"><a href="/" class="nav-home"><img src="/img/fasttext-icon-white-web.png" alt="fastText"/></a><div><h5>Support</h5><a href="/docs/en/support.html">Getting Started</a><a href="/docs/en/supervised-tutorial.html">Tutorials</a><a href="/docs/en/faqs.html">FAQs</a><a href="/docs/en/api.html">API</a></div><div><h5>Community</h5><a href="https://www.facebook.com/groups/1174547215919768/" target="_blank">Facebook Group</a><a href="http://stackoverflow.com/questions/tagged/fasttext" target="_blank">Stack Overflow</a><a href="https://groups.google.com/forum/#!forum/fasttext-library" target="_blank">Google Group</a></div><div><h5>More</h5><a href="/blog">Blog</a><a href="https://github.com/facebookresearch/fastText" target="_blank">GitHub</a><a class="github-button" href="https://github.com/facebookresearch/fastText/" data-icon="octicon-star" data-count-href="/fastText/stargazers" data-count-api="/repos/fastText#stargazers_count" data-count-aria-label="# stargazers on GitHub" aria-label="Star this project on GitHub">Star</a></div></section><a href="https://code.facebook.com/projects/" target="_blank" class="fbOpenSource"><img src="/img/oss_logo.png" alt="Facebook Open Source" width="170" height="45"/></a><section class="copyright">Copyright © 2018 Facebook Inc.</section></footer></div></body></html>
|