# forked from LBRYCommunity/lbry-sdk
import hashlib
import hmac
import logging
import math
import os
import pkgutil
import string
import unicodedata

import ecdsa
import pbkdf2

from . import constants
from .hashing import hmac_sha_512

log = logging.getLogger(__name__)

# http://www.asahi-net.or.jp/~ax2s-kmtn/ref/unicode/e_asia.html
CJK_INTERVALS = [
    (0x4E00, 0x9FFF, 'CJK Unified Ideographs'),
    (0x3400, 0x4DBF, 'CJK Unified Ideographs Extension A'),
    (0x20000, 0x2A6DF, 'CJK Unified Ideographs Extension B'),
    (0x2A700, 0x2B73F, 'CJK Unified Ideographs Extension C'),
    (0x2B740, 0x2B81F, 'CJK Unified Ideographs Extension D'),
    (0xF900, 0xFAFF, 'CJK Compatibility Ideographs'),
    (0x2F800, 0x2FA1D, 'CJK Compatibility Ideographs Supplement'),
    (0x3190, 0x319F, 'Kanbun'),
    (0x2E80, 0x2EFF, 'CJK Radicals Supplement'),
    (0x2F00, 0x2FDF, 'CJK Radicals'),
    (0x31C0, 0x31EF, 'CJK Strokes'),
    (0x2FF0, 0x2FFF, 'Ideographic Description Characters'),
    (0xE0100, 0xE01EF, 'Variation Selectors Supplement'),
    (0x3100, 0x312F, 'Bopomofo'),
    (0x31A0, 0x31BF, 'Bopomofo Extended'),
    (0xFF00, 0xFFEF, 'Halfwidth and Fullwidth Forms'),
    (0x3040, 0x309F, 'Hiragana'),
    (0x30A0, 0x30FF, 'Katakana'),
    (0x31F0, 0x31FF, 'Katakana Phonetic Extensions'),
    (0x1B000, 0x1B0FF, 'Kana Supplement'),
    (0xAC00, 0xD7AF, 'Hangul Syllables'),
    (0x1100, 0x11FF, 'Hangul Jamo'),
    (0xA960, 0xA97F, 'Hangul Jamo Extended A'),
    (0xD7B0, 0xD7FF, 'Hangul Jamo Extended B'),
    (0x3130, 0x318F, 'Hangul Compatibility Jamo'),
    (0xA4D0, 0xA4FF, 'Lisu'),
    (0x16F00, 0x16F9F, 'Miao'),
    (0xA000, 0xA48F, 'Yi Syllables'),
    (0xA490, 0xA4CF, 'Yi Radicals'),
]


def is_CJK(c):
    n = ord(c)
    for imin, imax, _name in CJK_INTERVALS:
        if imin <= n <= imax:
            return True
    return False


def prepare_seed(seed):
    # normalize to NFKD so visually identical phrases map to the same code points
    seed = unicodedata.normalize('NFKD', str(seed))
    # lowercase
    seed = seed.lower()
    # remove accents (the combining marks left over from NFKD decomposition)
    seed = ''.join([c for c in seed if not unicodedata.combining(c)])
    # collapse runs of whitespace to single spaces; this also strips the ends,
    # so the CJK pass below never indexes out of bounds
    seed = ' '.join(seed.split())
    # remove whitespace between CJK characters
    seed = ''.join([seed[i] for i in range(len(seed)) if not (seed[i] in string.whitespace
                                                              and is_CJK(seed[i - 1])
                                                              and is_CJK(seed[i + 1]))])
    return seed
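
# Illustrative check of the normalization above (a sketch; the input string is
# hypothetical, not from the original code): the umlauts decompose under NFKD,
# the combining marks are dropped, and the whitespace run collapses.
#
#   >>> prepare_seed('F\u00d6\u00d6   bar')
#   'foo bar'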


filenames = {
    'en': 'english.txt',
    'es': 'spanish.txt',
    'ja': 'japanese.txt',
    'pt': 'portuguese.txt',
    'zh': 'chinese_simplified.txt'
}


class Mnemonic:
    """
    Seed derivation no longer follows BIP39.

    The mnemonic phrase uses a hash-based checksum instead of a
    wordlist-dependent checksum.
    """

    def __init__(self, lang=None):
        lang = lang or "en"
        filename = filenames.get(lang[0:2], 'english.txt')
        s = pkgutil.get_data('lbrynet', os.path.join('wallet', 'wordlist', filename))
        s = unicodedata.normalize('NFKD', s.decode('utf8'))
        lines = s.split('\n')
        self.wordlist = []
        for line in lines:
            # drop comments and surrounding whitespace; each surviving
            # wordlist entry must be a single word
            line = line.split('#')[0]
            line = line.strip(' \r')
            assert ' ' not in line
            if line:
                self.wordlist.append(line)
        log.info("wordlist has %d words", len(self.wordlist))
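
    # The wordlist files parsed above are plain text, one word per line, with
    # '#' starting a comment. A hypothetical excerpt (not the real file):
    #
    #   # english.txt
    #   abandon
    #   ability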

    @classmethod
    def mnemonic_to_seed(cls, mnemonic, passphrase):
        PBKDF2_ROUNDS = 2048
        mnemonic = prepare_seed(mnemonic)
        # stretch the normalized phrase into 64 bytes of key material,
        # salted with 'lbryum' plus the user passphrase
        return pbkdf2.PBKDF2(mnemonic, 'lbryum' + passphrase, iterations=PBKDF2_ROUNDS,
                             macmodule=hmac, digestmodule=hashlib.sha512).read(64)
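
    # Minimal usage sketch (the phrase and empty passphrase are hypothetical
    # placeholders, not a real seed):
    #
    #   seed_bytes = Mnemonic.mnemonic_to_seed('hypothetical test phrase', '')
    #   assert len(seed_bytes) == 64  # PBKDF2-HMAC-SHA512, 64 bytes requested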

    def mnemonic_encode(self, i):
        # write i in base n, least-significant word first
        n = len(self.wordlist)
        words = []
        while i:
            x = i % n
            i = i // n
            words.append(self.wordlist[x])
        return ' '.join(words)

    def mnemonic_decode(self, seed):
        # inverse of mnemonic_encode: fold the words back into an integer,
        # starting from the most significant (last) word
        n = len(self.wordlist)
        words = seed.split()
        i = 0
        while words:
            w = words.pop()
            k = self.wordlist.index(w)
            i = i * n + k
        return i
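
    # Round-trip sketch (assumes the lbrynet wordlist data is installed so
    # Mnemonic() can load it): encode and decode are exact inverses because
    # the word sequence is just the integer written in base len(wordlist).
    #
    #   m = Mnemonic('en')
    #   assert m.mnemonic_decode(m.mnemonic_encode(123456789)) == 123456789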

    def check_seed(self, seed, custom_entropy):
        assert is_new_seed(seed)
        i = self.mnemonic_decode(seed)
        return i % custom_entropy == 0

    def make_seed(self, num_bits=128, prefix=constants.SEED_PREFIX, custom_entropy=1):
        # bits of entropy already supplied by custom_entropy
        n = int(math.ceil(math.log(custom_entropy, 2)))
        # bits of entropy used by the prefix
        k = len(prefix) * 4
        # we add at least 16 bits
        n_added = max(16, k + num_bits - n)
        log.info("make_seed %s adding %d bits", prefix, n_added)
        my_entropy = ecdsa.util.randrange(pow(2, n_added))
        nonce = 0
        while True:
            # search for a nonce whose encoded seed passes the hash-based
            # version check in is_new_seed()
            nonce += 1
            i = custom_entropy * (my_entropy + nonce)
            seed = self.mnemonic_encode(i)
            assert i == self.mnemonic_decode(seed)
            if is_new_seed(seed, prefix):
                break
        log.info('%d words', len(seed.split()))
        return seed
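
    # Worked example of the entropy accounting above (illustrative numbers):
    # with num_bits=128, custom_entropy=1 (so n == 0) and a one-byte hex
    # prefix such as '01' (so k == 8), n_added = max(16, 8 + 128 - 0) = 136.
    # Matching the k-bit prefix in the loop costs roughly k bits of the
    # candidate space, leaving about num_bits of entropy in the final seed.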


def is_new_seed(x, prefix=constants.SEED_PREFIX):
    x = prepare_seed(x)
    # the seed "checksum" is a hash prefix: the HMAC-SHA512 of the normalized
    # phrase must start with the expected version prefix
    s = hmac_sha_512(b"Seed version", x.encode('utf8')).hex()
    return s.startswith(prefix)
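

# A minimal end-to-end sketch, assuming this module lives inside the lbrynet
# package with its wordlist data present; run it via `python -m` so the
# relative imports resolve:
if __name__ == '__main__':
    m = Mnemonic('en')
    phrase = m.make_seed()  # prefixed seed phrase
    print(phrase)
    print(Mnemonic.mnemonic_to_seed(phrase, '').hex())  # 64-byte key material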