base.py 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381
  1. #!/usr/bin/env python3
  2. #
  3. # MMGen Wallet, a terminal-based cryptocurrency wallet
  4. # Copyright (C)2013-2025 The MMGen Project <mmgen@tuta.io>
  5. # Licensed under the GNU General Public License, Version 3:
  6. # https://www.gnu.org/licenses
  7. # Public project repositories:
  8. # https://github.com/mmgen/mmgen-wallet
  9. # https://gitlab.com/mmgen/mmgen-wallet
  10. """
  11. proto.btc.tx.base: Bitcoin base transaction class
  12. """
  13. from collections import namedtuple
  14. from ....tx.base import Base as TxBase
  15. from ....obj import MMGenList, HexStr, ListItemAttr
  16. from ....util import msg, make_chksum_6, die, pp_fmt
  17. from .op_return_data import OpReturnData
  18. def data2scriptPubKey(data):
  19. return '6a' + '{:02x}'.format(len(data)) + data.hex() # OP_RETURN data
  20. def addr2scriptPubKey(proto, addr):
  21. def decode_addr(proto, addr):
  22. ap = proto.decode_addr(addr)
  23. assert ap, f'coin address {addr!r} could not be parsed'
  24. return ap.bytes.hex()
  25. return {
  26. 'p2pkh': '76a914' + decode_addr(proto, addr) + '88ac',
  27. 'p2sh': 'a914' + decode_addr(proto, addr) + '87',
  28. 'bech32': proto.witness_vernum_hex + '14' + decode_addr(proto, addr)
  29. }[addr.addr_fmt]
  30. def decodeScriptPubKey(proto, s):
  31. # src/wallet/rpc/addresses.cpp:
  32. # types: nonstandard, pubkey, pubkeyhash, scripthash, multisig, nulldata, witness_v0_keyhash
  33. ret = namedtuple('decoded_scriptPubKey', ['type', 'addr_fmt', 'addr', 'data'])
  34. if len(s) == 50 and s[:6] == '76a914' and s[-4:] == '88ac':
  35. return ret('pubkeyhash', 'p2pkh', proto.pubhash2addr(bytes.fromhex(s[6:-4]), 'p2pkh'), None)
  36. elif len(s) == 46 and s[:4] == 'a914' and s[-2:] == '87':
  37. return ret('scripthash', 'p2sh', proto.pubhash2addr(bytes.fromhex(s[4:-2]), 'p2sh'), None)
  38. elif len(s) == 44 and s[:4] == proto.witness_vernum_hex + '14':
  39. return ret('witness_v0_keyhash', 'bech32', proto.pubhash2bech32addr(bytes.fromhex(s[4:])), None)
  40. elif s[:2] == '6a': # OP_RETURN
  41. # range 1-80 == hex 2-160, plus 4 for opcode byte + push byte
  42. if 6 <= len(s) <= (proto.max_op_return_data_len * 2) + 6: # 2-160 -> 6-166
  43. return ret('nulldata', None, None, s[4:]) # return data in hex format
  44. else:
  45. raise ValueError('{}: OP_RETURN data bytes length not in range 1-{}'.format(
  46. len(s[4:]) // 2,
  47. proto.max_op_return_data_len))
  48. else:
  49. raise NotImplementedError(f'Unrecognized scriptPubKey ({s})')
  50. def DeserializeTX(proto, txhex):
  51. """
  52. Parse a serialized Bitcoin transaction
  53. For checking purposes, additionally reconstructs the serialized TX without signature
  54. """
  55. def bytes2int(bytes_le):
  56. return int(bytes_le[::-1].hex(), 16)
  57. def bytes2coin_amt(bytes_le):
  58. return proto.coin_amt(bytes2int(bytes_le), from_unit='satoshi')
  59. def bshift(n, *, skip=False, sub_null=False):
  60. nonlocal idx, raw_tx
  61. ret = tx[idx:idx+n]
  62. idx += n
  63. if sub_null:
  64. raw_tx += b'\x00'
  65. elif not skip:
  66. raw_tx += ret
  67. return ret
  68. # https://bitcoin.org/en/developer-reference#compactsize-unsigned-integers
  69. # For example, the number 515 is encoded as 0xfd0302.
  70. def readVInt(*, skip=False):
  71. nonlocal idx, raw_tx
  72. s = tx[idx]
  73. idx += 1
  74. if not skip:
  75. raw_tx.append(s)
  76. vbytes_len = 1 if s < 0xfd else 2 if s == 0xfd else 4 if s == 0xfe else 8
  77. if vbytes_len == 1:
  78. return s
  79. else:
  80. vbytes = tx[idx:idx+vbytes_len]
  81. idx += vbytes_len
  82. if not skip:
  83. raw_tx += vbytes
  84. return int(vbytes[::-1].hex(), 16)
  85. def make_txid(tx_bytes):
  86. from hashlib import sha256
  87. return sha256(sha256(tx_bytes).digest()).digest()[::-1].hex()
  88. tx = bytes.fromhex(txhex)
  89. raw_tx = bytearray()
  90. idx = 0
  91. d = {'version': bytes2int(bshift(4))}
  92. if d['version'] > 0x7fffffff: # version is signed integer
  93. die(3, f"{d['version']}: transaction version greater than maximum allowed value (int32_t)!")
  94. has_witness = tx[idx] == 0
  95. if has_witness:
  96. u = bshift(2, skip=True).hex()
  97. if u != '0001':
  98. die('IllegalWitnessFlagValue', f'{u!r}: Illegal value for flag in transaction!')
  99. d['num_txins'] = readVInt()
  100. d['txins'] = MMGenList([{
  101. 'txid': bshift(32)[::-1].hex(),
  102. 'vout': bytes2int(bshift(4)),
  103. 'scriptSig': bshift(readVInt(skip=True), sub_null=True).hex(),
  104. 'nSeq': bshift(4)[::-1].hex()
  105. } for i in range(d['num_txins'])])
  106. d['num_txouts'] = readVInt()
  107. d['txouts'] = MMGenList([{
  108. 'amt': bytes2coin_amt(bshift(8)),
  109. 'scriptPubKey': bshift(readVInt()).hex()
  110. } for i in range(d['num_txouts'])])
  111. for o in d['txouts']:
  112. o.update(decodeScriptPubKey(proto, o['scriptPubKey'])._asdict())
  113. if has_witness:
  114. # https://github.com/bitcoin/bips/blob/master/bip-0141.mediawiki
  115. # A non-witness program (defined hereinafter) txin MUST be associated with an empty
  116. # witness field, represented by a 0x00.
  117. d['txid'] = make_txid(tx[:4] + tx[6:idx] + tx[-4:])
  118. d['witness_size'] = len(tx) - idx + 2 - 4 # add len(marker+flag), subtract len(locktime)
  119. for txin in d['txins']:
  120. if tx[idx] == 0:
  121. bshift(1, skip=True)
  122. continue
  123. txin['witness'] = [
  124. bshift(readVInt(skip=True), skip=True).hex() for item in range(readVInt(skip=True))]
  125. else:
  126. d['txid'] = make_txid(tx)
  127. d['witness_size'] = 0
  128. if len(tx) - idx != 4:
  129. die('TxHexParseError', 'TX hex has invalid length: {} extra bytes'.format(len(tx)-idx-4))
  130. d['locktime'] = bytes2int(bshift(4))
  131. d['unsigned_hex'] = raw_tx.hex()
  132. return namedtuple('deserialized_tx', list(d.keys()))(**d)
  133. class Base(TxBase):
  134. rel_fee_desc = 'satoshis per byte'
  135. rel_fee_disp = 'sat/byte'
  136. _deserialized = None
  137. class Output(TxBase.Output): # output contains either addr or data, but not both
  138. data = ListItemAttr(OpReturnData, include_proto=True) # type None in parent cls
  139. class InputList(TxBase.InputList):
  140. # Lexicographical Indexing of Transaction Inputs and Outputs
  141. # https://github.com/bitcoin/bips/blob/master/bip-0069.mediawiki
  142. def sort_bip69(self):
  143. def sort_func(a):
  144. return (
  145. bytes.fromhex(a.txid)
  146. + int.to_bytes(a.vout, 4, 'big'))
  147. self.sort(key=sort_func)
  148. class OutputList(TxBase.OutputList):
  149. def sort_bip69(self):
  150. def sort_func(a):
  151. return (
  152. int.to_bytes(a.amt.to_unit('satoshi'), 8, 'big')
  153. + bytes.fromhex(
  154. addr2scriptPubKey(self.parent.proto, a.addr) if a.addr else
  155. data2scriptPubKey(a.data)))
  156. self.sort(key=sort_func)
  157. def has_segwit_inputs(self):
  158. return any(i.mmtype in ('S', 'B') for i in self.inputs)
  159. def has_segwit_outputs(self):
  160. return any(o.mmtype in ('S', 'B') for o in self.outputs)
  161. # https://bitcoin.stackexchange.com/questions/1195/how-to-calculate-transaction-size-before-sending
  162. # 180: uncompressed, 148: compressed
  163. def estimate_size_old(self):
  164. if not self.inputs or not self.outputs:
  165. return None
  166. return len(self.inputs)*180 + len(self.outputs)*34 + 10
  167. # https://bitcoincore.org/en/segwit_wallet_dev/
  168. # vsize: 3 times of the size with original serialization, plus the size with new
  169. # serialization, divide the result by 4 and round up to the next integer.
  170. # TODO: results differ slightly from actual transaction size
  171. def estimate_size(self):
  172. if not self.inputs or not self.outputs:
  173. return None
  174. sig_size = 72 # sig in DER format
  175. pubkey_size_uncompressed = 65
  176. pubkey_size_compressed = 33
  177. def get_inputs_size():
  178. # txid vout [scriptSig size (vInt)] scriptSig (<sig> <pubkey>) nSeq
  179. isize_common = 32 + 4 + 1 + 4 # txid vout [scriptSig size] nSeq = 41
  180. input_size = {
  181. 'L': isize_common + sig_size + pubkey_size_uncompressed, # = 180
  182. 'C': isize_common + sig_size + pubkey_size_compressed, # = 148
  183. 'S': isize_common + 23, # = 64
  184. 'B': isize_common + 0 # = 41
  185. }
  186. ret = sum(input_size[i.mmtype] for i in self.inputs if i.mmtype)
  187. # We have no way of knowing whether a non-MMGen P2PKH addr is compressed or uncompressed
  188. # until we see the key, so assume compressed for fee-estimation purposes. If fee estimate
  189. # is off by more than 5%, sign() aborts and user is instructed to use --vsize-adj option.
  190. return ret + sum(input_size['C'] for i in self.inputs if not i.mmtype)
  191. def get_outputs_size():
  192. # output bytes:
  193. # 8 (amt) + scriptlen_byte + script_bytes
  194. # script_bytes:
  195. # ADDR: p2pkh: 25, p2sh: 23, bech32: 22
  196. # DATA: opcode_byte ('6a') + push_byte + nulldata_bytes
  197. return sum(
  198. {'p2pkh':34, 'p2sh':32, 'bech32':31}[o.addr.addr_fmt] if o.addr else
  199. (11 + len(o.data)) if o.data else
  200. # guess value if o.addr is missing (probably a vault address):
  201. 34 if self.proto.coin == 'BCH' else
  202. 31
  203. for o in self.outputs)
  204. # https://github.com/bitcoin/bips/blob/master/bip-0141.mediawiki
  205. # The witness is a serialization of all witness data of the transaction. Each txin is
  206. # associated with a witness field. A witness field starts with a var_int to indicate the
  207. # number of stack items for the txin. It is followed by stack items, with each item starts
  208. # with a var_int to indicate the length. Witness data is NOT script.
  209. # A non-witness program txin MUST be associated with an empty witness field, represented
  210. # by a 0x00. If all txins are not witness program, a transaction's wtxid is equal to its txid.
  211. def get_witness_size():
  212. if not self.has_segwit_inputs():
  213. return 0
  214. wf_size = 1 + 1 + sig_size + 1 + pubkey_size_compressed # vInt vInt sig vInt pubkey = 108
  215. return sum((1, wf_size)[i.mmtype in ('S', 'B')] for i in self.inputs)
  216. isize = get_inputs_size()
  217. osize = get_outputs_size()
  218. wsize = get_witness_size()
  219. # TODO: compute real varInt sizes instead of assuming 1 byte
  220. # Serialization:
  221. # old: [nVersion] [vInt][txins][vInt][txouts] [nLockTime]
  222. old_size = 4 + 1 + isize + 1 + osize + 4
  223. # marker = 0x00, flag = 0x01
  224. # new: [nVersion][marker][flag][vInt][txins][vInt][txouts][witness][nLockTime]
  225. new_size = 4 + 1 + 1 + 1 + isize + 1 + osize + wsize + 4 if wsize else old_size
  226. ret = (old_size * 3 + new_size) // 4
  227. self.cfg._util.dmsg(
  228. '\nData from estimate_size():\n' +
  229. f' inputs size: {isize}, outputs size: {osize}, witness size: {wsize}\n' +
  230. f' size: {new_size}, vsize: {ret}, old_size: {old_size}')
  231. return int(ret * (self.cfg.vsize_adj or 1))
  232. # convert absolute CoinAmt fee to sat/byte for display using estimated size
  233. def fee_abs2rel(self, abs_fee, *, to_unit='satoshi'):
  234. return str(int(
  235. abs_fee /
  236. getattr(self.proto.coin_amt, to_unit) /
  237. self.estimate_size()))
  238. @property
  239. def data_output(self):
  240. res = self.data_outputs
  241. if len(res) > 1:
  242. raise ValueError(f'{res}: too many data outputs in transaction (only one allowed)')
  243. return res[0] if len(res) == 1 else None
  244. @data_output.setter
  245. def data_output(self, val):
  246. dbool = [bool(o.data) for o in self.outputs]
  247. if dbool.count(True) != 1:
  248. raise ValueError('more or less than one data output in transaction!')
  249. self.outputs[dbool.index(True)] = val
  250. @property
  251. def data_outputs(self):
  252. return [o for o in self.outputs if o.data]
  253. @property
  254. def nondata_outputs(self):
  255. return [o for o in self.outputs if not o.data]
  256. @property
  257. def deserialized(self):
  258. if not self._deserialized:
  259. self._deserialized = DeserializeTX(self.proto, self.serialized)
  260. return self._deserialized
  261. def update_serialized(self, data):
  262. self.serialized = HexStr(data)
  263. self._deserialized = None
  264. self.check_serialized_integrity()
  265. def check_serialized_integrity(self):
  266. """
  267. Check that a malicious, compromised or malfunctioning coin daemon hasn't produced bad
  268. serialized tx data.
  269. Does not check witness data.
  270. Perform this check every time a serialized tx is received from the coin daemon or read
  271. from a transaction file.
  272. """
  273. def do_error(errmsg):
  274. die('TxHexMismatch', errmsg+'\n'+hdr)
  275. def check_equal(desc, hexio, mmio):
  276. if mmio != hexio:
  277. msg('\nMMGen {d}:\n{m}\nSerialized {d}:\n{h}'.format(
  278. d = desc,
  279. m = pp_fmt(mmio),
  280. h = pp_fmt(hexio)))
  281. do_error(
  282. f'{desc.capitalize()} in serialized transaction data from coin daemon ' +
  283. 'do not match those in MMGen transaction!')
  284. hdr = 'A malicious or malfunctioning coin daemon or other program may have altered your data!'
  285. dtx = self.deserialized
  286. if dtx.locktime != int(self.locktime or 0):
  287. do_error(
  288. f'Transaction hex nLockTime ({dtx.locktime}) ' +
  289. f'does not match MMGen transaction nLockTime ({self.locktime})')
  290. check_equal(
  291. 'sequence numbers',
  292. [i['nSeq'] for i in dtx.txins],
  293. ['{:08x}'.format(i.sequence or self.proto.max_int) for i in self.inputs])
  294. check_equal(
  295. 'inputs',
  296. sorted((i['txid'], i['vout']) for i in dtx.txins),
  297. sorted((i.txid, i.vout) for i in self.inputs))
  298. check_equal(
  299. 'outputs',
  300. sorted((o['addr'] or o['data'], o['amt']) for o in dtx.txouts),
  301. sorted((o.addr or o.data.hex(), o.amt) for o in self.outputs))
  302. if str(self.txid) != make_chksum_6(bytes.fromhex(dtx.unsigned_hex)).upper():
  303. do_error(f'MMGen TxID ({self.txid}) does not match serialized transaction data!')