about summary refs log tree commit diff
path: root/src/mnemonics/electrum-words.cpp
diff options
context:
space:
mode:
Diffstat (limited to '')
-rw-r--r-- src/mnemonics/electrum-words.cpp 382
1 files changed, 181 insertions, 201 deletions
diff --git a/src/mnemonics/electrum-words.cpp b/src/mnemonics/electrum-words.cpp
index 334bc578f..7caa3f72b 100644
--- a/src/mnemonics/electrum-words.cpp
+++ b/src/mnemonics/electrum-words.cpp
@@ -41,6 +41,7 @@
#include <map>
#include <cstdint>
#include <vector>
+#include <unordered_map>
#include <boost/algorithm/string.hpp>
#include "crypto/crypto.h" // for declaration of crypto::secret_key
#include <fstream>
@@ -55,97 +56,93 @@
#include "portuguese.h"
#include "japanese.h"
#include "old_english.h"
+#include "language_base.h"
+#include "singleton.h"
namespace
{
- int num_words = 0;
const int seed_length = 24;
- std::map<std::string,uint32_t> words_map;
- std::vector<std::string> words_array;
-
- bool is_old_style_word_list = false;
-
- const std::string WORD_LISTS_DIRECTORY = "wordlists";
- const std::string LANGUAGES_DIRECTORY = "languages";
- const std::string OLD_WORD_FILE = "old-word-list";
-
- const int unique_prefix_length = 4;
/*!
- * \brief Tells if the module hasn't been initialized with a word list file.
- * \return true if the module hasn't been initialized with a word list file false otherwise.
+ * \brief Finds the word list that contains the seed words and puts the indices
+ * where matches occurred in matched_indices.
+ * \param seed List of words to match.
+ * \param has_checksum If word list passed checksum test, we need to only do a prefix check.
+ * \param matched_indices The indices where the seed words were found are added to this.
+ * \param word_list_length Set to the size of the matching language's word list.
+ * \param language_name Set to the name of the matching language.
+ * \return true if all the words were present in some language false if not.
*/
- bool is_uninitialized()
+ bool find_seed_language(const std::vector<std::string> &seed,
+ bool has_checksum, std::vector<uint32_t> &matched_indices, uint32_t &word_list_length,
+ std::string &language_name)
{
- return num_words == 0 ? true : false;
- }
-
- /*!
- * \brief Create word list map and array data structres for use during inter-conversion between
- * words and secret key.
- * \param word_file Path to the word list file from pwd.
- * \param has_checksum True if checksum was supplied false if not.
- */
- void create_data_structures(const std::string &word_file, bool has_checksum)
- {
- words_array.clear();
- words_map.clear();
- num_words = 0;
- std::ifstream input_stream;
- input_stream.open(word_file.c_str(), std::ifstream::in);
-
- if (!input_stream)
- throw std::runtime_error("Word list file couldn't be opened.");
-
- std::string word;
- while (input_stream >> word)
+ // If there's a new language added, add an instance of it here.
+ std::vector<Language::Base*> language_instances({
+ Language::Singleton<Language::English>::instance(),
+ Language::Singleton<Language::Spanish>::instance(),
+ Language::Singleton<Language::Portuguese>::instance(),
+ Language::Singleton<Language::Japanese>::instance(),
+ Language::Singleton<Language::OldEnglish>::instance()
+ });
+ // To hold trimmed seed words in case of a checksum being present.
+ std::vector<std::string> trimmed_seed;
+ if (has_checksum)
{
- if (word.length() == 0 || word[0] == '#')
- {
- // Skip empty and comment lines
- continue;
- }
- words_array.push_back(word);
- if (has_checksum)
+ // If it had a checksum, we'll just compare the unique prefix
+ // So we create a list of trimmed seed words
+ for (std::vector<std::string>::const_iterator it = seed.begin(); it != seed.end(); it++)
{
- // Only if checksum was passed should we stick to just 4 char checks to be lenient about typos.
- words_map[word.substr(0, unique_prefix_length)] = num_words;
+ trimmed_seed.push_back(it->length() > Language::unique_prefix_length ?
+ it->substr(0, Language::unique_prefix_length) : *it);
}
- else
- {
- words_map[word] = num_words;
- }
- num_words++;
}
- input_stream.close();
- }
-
- /*!
- * \brief Tells if all the words passed in wlist was present in current word list file.
- * \param wlist List of words to match.
- * \param has_checksum If word list passed checksum test, we need to only do a 4 char check.
- * \return true if all the words were present false if not.
- */
- bool word_list_file_match(const std::vector<std::string> &wlist, bool has_checksum)
- {
- for (std::vector<std::string>::const_iterator it = wlist.begin(); it != wlist.end(); it++)
+ std::unordered_map<std::string, uint32_t> word_map;
+ std::unordered_map<std::string, uint32_t> trimmed_word_map;
+ // Iterate through all the languages and find a match
+ for (std::vector<Language::Base*>::iterator it1 = language_instances.begin();
+ it1 != language_instances.end(); it1++)
{
- if (has_checksum)
+ word_map = (*it1)->get_word_map();
+ trimmed_word_map = (*it1)->get_trimmed_word_map();
+ // trimmed_seed is filled only when a checksum is present, so the scan is bounded
+ // by seed alone; bounding it by trimmed_seed too would skip every word of a
+ // checksum-less seed and report a match with no indices.
+ bool full_match = true;
+
+ // Iterate through all the words and see if they're all present
+ for (std::vector<std::string>::size_type word_index = 0; word_index != seed.size(); word_index++)
{
- if (words_map.count(it->substr(0, unique_prefix_length)) == 0)
+ if (has_checksum)
{
- return false;
+ // Use the trimmed words and map
+ if (trimmed_word_map.count(trimmed_seed[word_index]) == 0)
+ {
+ full_match = false;
+ break;
+ }
+ matched_indices.push_back(trimmed_word_map[trimmed_seed[word_index]]);
}
- }
- else
- {
- if (words_map.count(*it) == 0)
+ else
{
- return false;
+ if (word_map.count(seed[word_index]) == 0)
+ {
+ full_match = false;
+ break;
+ }
+ matched_indices.push_back(word_map[seed[word_index]]);
}
}
+ if (full_match)
+ {
+ word_list_length = (*it1)->get_word_list().size();
+ language_name = (*it1)->get_language_name();
+ return true;
+ }
+ // Some didn't match. Clear the index array.
+ matched_indices.clear();
}
- return true;
+ return false;
}
/*!
@@ -155,16 +152,43 @@ namespace
*/
uint32_t create_checksum_index(const std::vector<std::string> &word_list)
{
- std::string four_char_words = "";
+ std::string trimmed_words = "";
for (std::vector<std::string>::const_iterator it = word_list.begin(); it != word_list.end(); it++)
{
- four_char_words += it->substr(0, unique_prefix_length);
+ // Test against the shared prefix length (not a literal 4) so the threshold and the cut agree.
+ if (it->length() > Language::unique_prefix_length)
+ {
+ trimmed_words += it->substr(0, Language::unique_prefix_length);
+ }
+ else
+ {
+ trimmed_words += *it;
+ }
}
boost::crc_32_type result;
- result.process_bytes(four_char_words.data(), four_char_words.length());
+ result.process_bytes(trimmed_words.data(), trimmed_words.length());
return result.checksum() % seed_length;
}
+
+ /*!
+ * \brief Does the checksum test on the seed passed.
+ * \param seed Vector of seed words whose last word is the checksum word (taken by value; the copy is modified).
+ * \return True if the test passed false if not (including a seed of the wrong length).
+ */
+ bool checksum_test(std::vector<std::string> seed)
+ {
+ // create_checksum_index() returns an index below seed_length, so anything but
+ // seed_length words plus the checksum word could be indexed out of range.
+ if (seed.size() != seed_length + 1) return false;
+ // The last word is the checksum.
+ const std::string last_word = seed.back();
+ seed.pop_back();
+ const std::string &checksum = seed[create_checksum_index(seed)];
+
+ // Trim each word by its own length: substr() clamps the count, so short words stay whole.
+ return checksum.substr(0, Language::unique_prefix_length) ==
+ last_word.substr(0, Language::unique_prefix_length);
+ }
}
/*!
@@ -182,114 +206,62 @@ namespace crypto
namespace ElectrumWords
{
/*!
- * \brief Called to initialize it to work with a word list file.
- * \param language Language of the word list file.
- * \param has_checksum True if the checksum was passed false if not.
- * \param old_word_list true it is to use the old style word list file false if not.
- */
- void init(const std::string &language, bool has_checksum, bool old_word_list)
- {
- if (old_word_list)
- {
- // Use the old word list file if told to.
- create_data_structures(WORD_LISTS_DIRECTORY + '/' + OLD_WORD_FILE, has_checksum);
- is_old_style_word_list = true;
- }
- else
- {
- create_data_structures(WORD_LISTS_DIRECTORY + '/' + LANGUAGES_DIRECTORY + '/' + language, has_checksum);
- is_old_style_word_list = false;
- }
- if (num_words == 0)
- {
- throw std::runtime_error(std::string("Word list file is empty: ") +
- (old_word_list ? OLD_WORD_FILE : (LANGUAGES_DIRECTORY + '/' + language)));
- }
- }
-
- /*!
* \brief Converts seed words to bytes (secret key).
- * \param words String containing the words separated by spaces.
- * \param dst To put the secret key restored from the words.
- * \return false if not a multiple of 3 words, or if word is not in the words list
+ * \param words String containing the words separated by spaces.
+ * \param dst To put the secret key restored from the words.
+ * \param language_name Language of the seed as found gets written here.
+ * \return false if not a multiple of 3 words, or if word is not in the words list
*/
- bool words_to_bytes(const std::string& words, crypto::secret_key& dst)
+ bool words_to_bytes(const std::string& words, crypto::secret_key& dst,
+ std::string &language_name)
{
- std::vector<std::string> wlist;
+ std::vector<std::string> seed;
- boost::split(wlist, words, boost::is_any_of(" "));
+ boost::split(seed, words, boost::is_any_of(" "));
- // If it is seed with a checksum.
- bool has_checksum = (wlist.size() == seed_length + 1);
+ // error on non-compliant word list
+ if (seed.size() != seed_length/2 && seed.size() != seed_length &&
+ seed.size() != seed_length + 1)
+ {
+ return false;
+ }
+ // If it is seed with a checksum.
+ bool has_checksum = seed.size() == (seed_length + 1);
if (has_checksum)
{
- // The last word is the checksum.
- std::string last_word = wlist.back();
- wlist.pop_back();
-
- std::string checksum = wlist[create_checksum_index(wlist)];
-
- if (checksum.substr(0, unique_prefix_length) != last_word.substr(0, unique_prefix_length))
+ if (!checksum_test(seed))
{
// Checksum fail
return false;
}
}
- // Try to find a word list file that contains all the words in the word list.
- std::vector<std::string> languages;
- get_language_list(languages);
-
- std::vector<std::string>::iterator it;
- for (it = languages.begin(); it != languages.end(); it++)
- {
- init(*it, has_checksum);
- if (word_list_file_match(wlist, has_checksum))
- {
- break;
- }
- }
- // If no such file was found, see if the old style word list file has them all.
- if (it == languages.end())
+
+ std::vector<uint32_t> matched_indices;
+ uint32_t word_list_length;
+ if (!find_seed_language(seed, has_checksum, matched_indices, word_list_length, language_name))
{
- init("", has_checksum, true);
- if (!word_list_file_match(wlist, has_checksum))
- {
- return false;
- }
+ return false;
}
- int n = num_words;
-
- // error on non-compliant word list
- if (wlist.size() != 12 && wlist.size() != 24) return false;
- for (unsigned int i=0; i < wlist.size() / 3; i++)
+ for (unsigned int i=0; i < seed.size() / 3; i++)
{
uint32_t val;
uint32_t w1, w2, w3;
+ w1 = matched_indices[i*3];
+ w2 = matched_indices[i*3 + 1];
+ w3 = matched_indices[i*3 + 2];
- if (has_checksum)
- {
- w1 = words_map.at(wlist[i*3].substr(0, unique_prefix_length));
- w2 = words_map.at(wlist[i*3 + 1].substr(0, unique_prefix_length));
- w3 = words_map.at(wlist[i*3 + 2].substr(0, unique_prefix_length));
- }
- else
- {
- w1 = words_map.at(wlist[i*3]);
- w2 = words_map.at(wlist[i*3 + 1]);
- w3 = words_map.at(wlist[i*3 + 2]);
- }
+ val = w1 + word_list_length * (((word_list_length - w1) + w2) % word_list_length) +
+ word_list_length * word_list_length * (((word_list_length - w2) + w3) % word_list_length);
- val = w1 + n * (((n - w1) + w2) % n) + n * n * (((n - w2) + w3) % n);
-
- if (!(val % n == w1)) return false;
+ if (!(val % word_list_length == w1)) return false;
memcpy(dst.data + i * 4, &val, 4); // copy 4 bytes to position
}
std::string wlist_copy = words;
- if (wlist.size() == 12)
+ if (seed.size() == seed_length/2)
{
memcpy(dst.data, dst.data + 16, 16); // if electrum 12-word seed, duplicate
wlist_copy += ' ';
@@ -301,23 +273,44 @@ namespace crypto
/*!
* \brief Converts bytes (secret key) to seed words.
- * \param src Secret key
- * \param words Space delimited concatenated words get written here.
- * \return true if successful false if not. Unsuccessful if wrong key size.
+ * \param src Secret key
+ * \param words Space delimited concatenated words get written here.
+ * \param language_name Seed language name
+ * \return true if successful false if not. Unsuccessful if wrong key size.
*/
- bool bytes_to_words(const crypto::secret_key& src, std::string& words)
+ bool bytes_to_words(const crypto::secret_key& src, std::string& words,
+ const std::string &language_name)
{
- if (is_uninitialized())
+
+ if (sizeof(src.data) % 4 != 0 || sizeof(src.data) == 0) return false;
+
+ std::vector<std::string> word_list;
+ Language::Base *language;
+ if (language_name == "English")
{
- init("english", true);
+ language = Language::Singleton<Language::English>::instance();
}
-
+ else if (language_name == "Spanish")
+ {
+ language = Language::Singleton<Language::Spanish>::instance();
+ }
+ else if (language_name == "Portuguese")
+ {
+ language = Language::Singleton<Language::Portuguese>::instance();
+ }
+ else if (language_name == "Japanese")
+ {
+ language = Language::Singleton<Language::Japanese>::instance();
+ }
+ else
+ {
+ return false;
+ }
+ word_list = language->get_word_list();
// To store the words for random access to add the checksum word later.
std::vector<std::string> words_store;
- int n = num_words;
-
- if (sizeof(src.data) % 4 != 0 || sizeof(src.data) == 0) return false;
+ uint32_t word_list_length = word_list.size();
// 8 bytes -> 3 words. 8 digits base 16 -> 3 digits base 1626
for (unsigned int i=0; i < sizeof(src.data)/4; i++, words += ' ')
{
@@ -327,19 +320,19 @@ namespace crypto
memcpy(&val, (src.data) + (i * 4), 4);
- w1 = val % n;
- w2 = ((val / n) + w1) % n;
- w3 = (((val / n) / n) + w2) % n;
+ w1 = val % word_list_length;
+ w2 = ((val / word_list_length) + w1) % word_list_length;
+ w3 = (((val / word_list_length) / word_list_length) + w2) % word_list_length;
- words += words_array[w1];
+ words += word_list[w1];
words += ' ';
- words += words_array[w2];
+ words += word_list[w2];
words += ' ';
- words += words_array[w3];
+ words += word_list[w3];
- words_store.push_back(words_array[w1]);
- words_store.push_back(words_array[w2]);
- words_store.push_back(words_array[w3]);
+ words_store.push_back(word_list[w1]);
+ words_store.push_back(word_list[w2]);
+ words_store.push_back(word_list[w3]);
}
words.pop_back();
@@ -353,31 +346,18 @@ namespace crypto
*/
void get_language_list(std::vector<std::string> &languages)
{
+ // Keep resetting the output so a reused vector does not accumulate duplicate names.
languages.clear();
- boost::filesystem::path languages_directory("wordlists/languages");
- if (!boost::filesystem::exists(languages_directory) ||
- !boost::filesystem::is_directory(languages_directory))
- {
- throw std::runtime_error("Word list languages directory is missing.");
- }
- boost::filesystem::directory_iterator end;
- for (boost::filesystem::directory_iterator it(languages_directory); it != end; it++)
- {
- languages.push_back(it->path().filename().string());
- }
- }
-
- /*!
- * \brief Tells if the module is currenly using an old style word list.
- * \return true if it is currenly using an old style word list false if not.
- */
- bool get_is_old_style_word_list()
- {
- if (is_uninitialized())
+ std::vector<Language::Base*> language_instances({
+ Language::Singleton<Language::English>::instance(),
+ Language::Singleton<Language::Spanish>::instance(),
+ Language::Singleton<Language::Portuguese>::instance(),
+ Language::Singleton<Language::Japanese>::instance(),
+ Language::Singleton<Language::OldEnglish>::instance()
+ });
+ for (std::vector<Language::Base*>::iterator it = language_instances.begin();
+ it != language_instances.end(); it++)
{
- throw std::runtime_error("ElectrumWords hasn't been initialized with a word list yet.");
+ languages.push_back((*it)->get_language_name());
}
- return is_old_style_word_list;
}
/*!
@@ -387,9 +367,9 @@ namespace crypto
*/
bool get_is_old_style_seed(const std::string &seed)
{
- std::vector<std::string> wlist;
- boost::split(wlist, seed, boost::is_any_of(" "));
- return wlist.size() != (seed_length + 1);
+ std::vector<std::string> word_list;
+ boost::split(word_list, seed, boost::is_any_of(" ")); // NOTE(review): splits on every single space; repeated spaces would presumably add empty tokens to the count - confirm callers normalize whitespace
+ return word_list.size() != (seed_length + 1); // old style = any word count other than seed_length words plus one trailing checksum word
}
}