123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111 |
- <?xml version="1.0" encoding="utf-8"?>
- <!--
-
- h t t :: / / t /
- h t t :: // // t //
- h ttttt ttttt ppppp sssss // // y y sssss ttttt //
- hhhh t t p p s // // y y s t //
- h hh t t ppppp sssss // // yyyyy sssss t //
- h h t t p s :: / / y .. s t .. /
- h h t t p sssss :: / / yyyyy .. sssss t .. /
-
- <https://y.st./>
- Copyright © 2015 Alex Yst <mailto:copyright@y.st>
- This program is free software: you can redistribute it and/or modify
- it under the terms of the GNU General Public License as published by
- the Free Software Foundation, either version 3 of the License, or
- (at your option) any later version.
- This program is distributed in the hope that it will be useful,
- but WITHOUT ANY WARRANTY; without even the implied warranty of
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- GNU General Public License for more details.
- You should have received a copy of the GNU General Public License
- along with this program. If not, see <https://www.gnu.org./licenses/>.
- -->
- <!DOCTYPE html>
- <html xmlns="http://www.w3.org/1999/xhtml">
- <head>
- <base href="https://y.st./en/weblog/2015/11-November/21.xhtml" />
- <title>More word lists for eschalot &lt;https://y.st./en/weblog/2015/11-November/21.xhtml&gt;</title>
- <link rel="icon" type="image/png" href="/link/CC_BY-SA_4.0/y.st./icon.png" />
- <link rel="stylesheet" type="text/css" href="/link/basic.css" />
- <link rel="stylesheet" type="text/css" href="/link/site-specific.css" />
- <script type="text/javascript" src="/script/javascript.js" />
- <meta name="viewport" content="width=device-width" />
- </head>
- <body>
- <nav>
- <p>
- <a href="/en/">Home</a> |
- <a href="/en/a/about.xhtml">About</a> |
- <a href="/en/a/contact.xhtml">Contact</a> |
- <a href="/a/canary.txt">Canary</a> |
- <a href="/en/URI_research/"><abbr title="Uniform Resource Identifier">URI</abbr> research</a> |
- <a href="/en/opinion/">Opinions</a> |
- <a href="/en/coursework/">Coursework</a> |
- <a href="/en/law/">Law</a> |
- <a href="/en/a/links.xhtml">Links</a> |
- <a href="/en/weblog/2015/11-November/21.xhtml.asc">{this page}.asc</a>
- </p>
- <hr/>
- <p>
- Weblog index:
- <a href="/en/weblog/"><abbr title="American Standard Code for Information Interchange">ASCII</abbr> calendars</a> |
- <a href="/en/weblog/index_ol_ascending.xhtml">Ascending list</a> |
- <a href="/en/weblog/index_ol_descending.xhtml">Descending list</a>
- </p>
- <hr/>
- <p>
- Jump to entry:
- <a href="/en/weblog/2015/03-March/07.xhtml">&lt;&lt;First</a>
- <a rel="prev" href="/en/weblog/2015/11-November/20.xhtml">&lt;Previous</a>
- <a rel="next" href="/en/weblog/2015/11-November/22.xhtml">Next&gt;</a>
- <a href="/en/weblog/latest.xhtml">Latest&gt;&gt;</a>
- </p>
- <hr/>
- </nav>
- <header>
- <h1>More word lists for eschalot</h1>
- <p>Day 00259: Saturday, 2015 November 21</p>
- </header>
- <p>
- I spent most of today cleaning, just like yesterday.
- </p>
- <p>
- I took a small break because I had a new idea.
- I should combine the dictionaries provided by Debian for different languages and create a multilingual dictionary to use with eschalot.
- With only a little bit of searching, I found that the relevant packages to install were <a href="apt:miscfiles"><code>miscfiles</code></a>, <a href="apt:wamerican"><code>wamerican</code></a>, <a href="apt:wamerican-huge"><code>wamerican-huge</code></a>, <a href="apt:wamerican-insane"><code>wamerican-insane</code></a>, <a href="apt:wamerican-large"><code>wamerican-large</code></a>, <a href="apt:wamerican-small"><code>wamerican-small</code></a>, <a href="apt:wbrazilian"><code>wbrazilian</code></a>, <a href="apt:wbritish"><code>wbritish</code></a>, <a href="apt:wbritish-huge"><code>wbritish-huge</code></a>, <a href="apt:wbritish-insane"><code>wbritish-insane</code></a>, <a href="apt:wbritish-large"><code>wbritish-large</code></a>, <a href="apt:wbritish-small"><code>wbritish-small</code></a>, <a href="apt:wbulgarian"><code>wbulgarian</code></a>, <a href="apt:wcanadian"><code>wcanadian</code></a>, <a href="apt:wcanadian-huge"><code>wcanadian-huge</code></a>, <a href="apt:wcanadian-insane"><code>wcanadian-insane</code></a>, <a href="apt:wcanadian-large"><code>wcanadian-large</code></a>, <a href="apt:wcanadian-small"><code>wcanadian-small</code></a>, <a href="apt:wcatalan"><code>wcatalan</code></a>, <a href="apt:wdanish"><code>wdanish</code></a>, <a href="apt:wdutch"><code>wdutch</code></a>, <a href="apt:wfaroese"><code>wfaroese</code></a>, <a href="apt:wfrench"><code>wfrench</code></a>, <a href="apt:wgalician-minimos"><code>wgalician-minimos</code></a>, <a href="apt:wgerman-medical"><code>wgerman-medical</code></a>, <a href="apt:witalian"><code>witalian</code></a>, <a href="apt:wngerman"><code>wngerman</code></a>, <a href="apt:wnorwegian"><code>wnorwegian</code></a>, <a href="apt:wogerman"><code>wogerman</code></a>, <a href="apt:wpolish"><code>wpolish</code></a>, <a href="apt:wportuguese"><code>wportuguese</code></a>, <a href="apt:wspanish"><code>wspanish</code></a>, <a href="apt:wswedish"><code>wswedish</code></a>, <a href="apt:wswiss"><code>wswiss</code></a>, and <a 
href="apt:wukrainian"><code>wukrainian</code></a>.
- After installing them, I ran into a bit of an issue, one that is even present in the initial dictionary installed on the system.
- Namely, several non-<abbr title="American Standard Code for Information Interchange">ASCII</abbr> (and therefore unusable in onion addresses) characters were present.
- I do not want to simply leave out these words, and internationalization is not possible in onion addresses due to the lack of a dash character.
- While trying to make a list of unavailable characters that I would have to account for, I found that, according to <a href="file:///usr/share/dict/dutch"><code>/usr/share/dict/dutch</code></a>, some Dutch words contain digits, spaces, periods, slashes, and/or plus signs.
- Furthermore, "06" is supposedly a word, and in the case of a few words seemingly relating to carbon dioxide, words may contain a subscript "2".
- I am unsure how reliable this file really is.
- <a href="file:///usr/share/dict/ukrainian"><code>/usr/share/dict/ukrainian</code></a> predictably contains no Latin characters, instead consisting of Cyrillic letters.
- Using these words would mean not merely making small changes here and there, but completely butchering every word.
- For that reason, there is a strong chance that I will not use the words in this file at all.
- Doing <strong>*any*</strong> sort of transformation of any words on these lists is a project for the distant future though.
- </p>
- <p>
- My <a href="/a/canary.txt">canary</a> still sings the tune of freedom and transparency.
- </p>
- <hr/>
- <p>
- Copyright © 2015 Alex Yst;
- You may modify and/or redistribute this document under the terms of the <a rel="license" href="/license/gpl-3.0-standalone.xhtml"><abbr title="GNU's Not Unix">GNU</abbr> <abbr title="General Public License version Three or later">GPLv3+</abbr></a>.
- If for some reason you would prefer to modify and/or distribute this document under other free copyleft terms, please ask me via email.
- My address is in the source comments near the top of this document.
- This license also applies to embedded content such as images.
- For more information on that, see <a href="/en/a/licensing.xhtml">licensing</a>.
- </p>
- <p>
- <abbr title="World Wide Web Consortium">W3C</abbr> standards are important.
- This document conforms to the <a href="https://validator.w3.org./nu/?doc=https%3A%2F%2Fy.st.%2Fen%2Fweblog%2F2015%2F11-November%2F21.xhtml"><abbr title="Extensible Hypertext Markup Language">XHTML</abbr> 5.1</a> specification and uses style sheets that conform to the <a href="http://jigsaw.w3.org./css-validator/validator?uri=https%3A%2F%2Fy.st.%2Fen%2Fweblog%2F2015%2F11-November%2F21.xhtml"><abbr title="Cascading Style Sheets">CSS</abbr>3</a> specification.
- </p>
- </body>
- </html>
|