WiktionaryDumps to words: Difference between revisions
Content added Content deleted
(→{{header|OCaml}}: Fixed regexp) |
(Updated output) |
||
Line 74: | Line 74: | ||
$ wget --quiet https://dumps.wikimedia.org/enwiktionary/latest/enwiktionary-latest-pages-articles.xml.bz2 -O - | bzcat | \ |
$ wget --quiet https://dumps.wikimedia.org/enwiktionary/latest/enwiktionary-latest-pages-articles.xml.bz2 -O - | bzcat | \ |
||
java WiktoWords |
java WiktoWords |
||
gratis |
|||
hélice |
|||
gratuit |
|||
pingouin |
|||
livre |
|||
égoïsme |
|||
chien |
|||
écholocation |
|||
pond |
|||
nitroglycérine |
|||
pies |
|||
croque-mitaine |
|||
pie |
|||
A |
|||
connotation |
|||
minute |
|||
... |
|||
</pre> |
</pre> |
||
Line 126: | Line 131: | ||
wget --quiet https://dumps.wikimedia.org/enwiktionary/latest/enwiktionary-latest-pages-articles.xml.bz2 -O - | bzcat | \ |
wget --quiet https://dumps.wikimedia.org/enwiktionary/latest/enwiktionary-latest-pages-articles.xml.bz2 -O - | bzcat | \ |
||
ocaml str.cma -I $(ocamlfind query xmlm) xmlm.cma to_words.ml |
ocaml str.cma -I $(ocamlfind query xmlm) xmlm.cma to_words.ml |
||
gratis |
|||
livrer |
|||
gratuit |
|||
observateur |
|||
livre |
|||
qui a bu boira |
|||
chien |
|||
quelque chose |
|||
pond |
|||
grande parure |
|||
pies |
|||
obiit |
|||
pie |
|||
pleuvoir |
|||
A |
|||
voir |
|||
connotation |
|||
minute |
|||
... |
... |
||
</pre> |
</pre> |