2022-06-29 04:05:31 +00:00
|
|
|
// Written in 2019 by Andrew Poelstra <apoelstra@wpsoftware.net>
|
|
|
|
// SPDX-License-Identifier: CC0-1.0
|
2019-07-26 07:36:25 +00:00
|
|
|
|
|
|
|
// This module was largely copied from https://github.com/rust-bitcoin/murmel/blob/master/src/blockfilter.rs
|
|
|
|
// on 11. June 2019 which is licensed under Apache, that file specifically
|
|
|
|
// was written entirely by Tamas Blummer, who is re-licensing its contents here as CC0.
|
|
|
|
|
2022-08-09 04:50:41 +00:00
|
|
|
//! BIP 158 Compact Block Filters for Light Clients.
|
2019-07-26 07:36:25 +00:00
|
|
|
//!
|
2021-11-05 21:58:18 +00:00
|
|
|
//! This module implements a structure for compact filters on block data, for
|
|
|
|
//! use in the BIP 157 light client protocol. The filter construction proposed
|
|
|
|
//! is an alternative to Bloom filters, as used in BIP 37, that minimizes filter
|
|
|
|
//! size by using Golomb-Rice coding for compression.
|
2019-07-26 07:36:25 +00:00
|
|
|
//!
|
2022-08-09 04:50:41 +00:00
|
|
|
//! ### Relevant BIPS
|
|
|
|
//!
|
|
|
|
//! * [BIP 157 - Client Side Block Filtering](https://github.com/bitcoin/bips/blob/master/bip-0157.mediawiki)
|
|
|
|
//! * [BIP 158 - Compact Block Filters for Light Clients](https://github.com/bitcoin/bips/blob/master/bip-0158.mediawiki)
|
|
|
|
//!
|
|
|
|
//! # Examples
|
2021-02-17 20:35:13 +00:00
|
|
|
//!
|
|
|
|
//! ```ignore
|
|
|
|
//! fn get_script_for_coin(coin: &OutPoint) -> Result<Script, BlockFilterError> {
|
|
|
|
//! // get utxo ...
|
|
|
|
//! }
|
2022-01-24 00:24:32 +00:00
|
|
|
//!
|
2021-02-17 20:35:13 +00:00
|
|
|
//! // create a block filter for a block (server side)
|
|
|
|
//! let filter = BlockFilter::new_script_filter(&block, get_script_for_coin)?;
|
|
|
|
//!
|
|
|
|
//! // or create a filter from known raw data
|
|
|
|
//! let filter = BlockFilter::new(content);
|
2022-01-24 00:24:32 +00:00
|
|
|
//!
|
2021-02-17 20:35:13 +00:00
|
|
|
//! // read and evaluate a filter
|
2022-01-24 00:24:32 +00:00
|
|
|
//!
|
2021-02-17 20:35:13 +00:00
|
|
|
//! let query: Iterator<Item=Script> = // .. some scripts you care about
|
|
|
|
//! if filter.match_any(&block_hash, &mut query.map(|s| s.as_bytes())) {
|
|
|
|
//! // get this block
|
|
|
|
//! }
|
|
|
|
//! ```
|
2022-01-24 00:24:32 +00:00
|
|
|
//!
|
2019-07-26 07:36:25 +00:00
|
|
|
|
2022-05-02 22:13:57 +00:00
|
|
|
use crate::prelude::*;
|
2022-08-08 05:30:26 +00:00
|
|
|
use crate::io;
|
2021-06-09 10:34:44 +00:00
|
|
|
|
2021-06-09 10:40:41 +00:00
|
|
|
use core::fmt::{self, Display, Formatter};
|
|
|
|
use core::cmp::{self, Ordering};
|
2019-07-26 07:36:25 +00:00
|
|
|
|
2022-05-02 22:13:57 +00:00
|
|
|
use crate::hashes::{Hash, siphash24};
|
|
|
|
use crate::hash_types::{BlockHash, FilterHash, FilterHeader};
|
2019-07-26 07:36:25 +00:00
|
|
|
|
2022-05-02 22:13:57 +00:00
|
|
|
use crate::blockdata::block::Block;
|
|
|
|
use crate::blockdata::script::Script;
|
|
|
|
use crate::blockdata::transaction::OutPoint;
|
|
|
|
use crate::consensus::{Decodable, Encodable};
|
|
|
|
use crate::consensus::encode::VarInt;
|
|
|
|
use crate::util::endian;
|
2022-06-07 03:25:27 +00:00
|
|
|
use crate::internal_macros::write_err;
|
2019-07-26 07:36:25 +00:00
|
|
|
|
|
|
|
/// Golomb encoding parameter as in BIP-158, see also https://gist.github.com/sipa/576d5f09c3b86c3b1b75598d799fc845
|
|
|
|
const P: u8 = 19;
|
|
|
|
const M: u64 = 784931;
|
|
|
|
|
|
|
|
/// Errors for blockfilter
|
|
|
|
#[derive(Debug)]
|
|
|
|
pub enum Error {
|
|
|
|
/// missing UTXO, can not calculate script filter
|
|
|
|
UtxoMissing(OutPoint),
|
|
|
|
/// some IO error reading or writing binary serialization of the filter
|
|
|
|
Io(io::Error),
|
|
|
|
}
|
|
|
|
|
|
|
|
impl Display for Error {
|
|
|
|
fn fmt(&self, f: &mut Formatter) -> Result<(), fmt::Error> {
|
|
|
|
match *self {
|
|
|
|
Error::UtxoMissing(ref coin) => write!(f, "unresolved UTXO {}", coin),
|
2022-05-25 02:56:51 +00:00
|
|
|
Error::Io(ref e) => write_err!(f, "IO error"; e),
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-05-04 05:08:33 +00:00
|
|
|
#[cfg(feature = "std")]
|
|
|
|
#[cfg_attr(docsrs, doc(cfg(feature = "std")))]
|
2022-05-04 05:56:24 +00:00
|
|
|
impl std::error::Error for Error {
|
|
|
|
fn source(&self) -> Option<&(dyn std::error::Error + 'static)> {
|
|
|
|
use self::Error::*;
|
|
|
|
|
|
|
|
match self {
|
|
|
|
UtxoMissing(_) => None,
|
|
|
|
Io(e) => Some(e),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-07-26 07:36:25 +00:00
|
|
|
impl From<io::Error> for Error {
|
|
|
|
fn from(io: io::Error) -> Self {
|
|
|
|
Error::Io(io)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// a computed or read block filter
|
2020-10-11 20:25:38 +00:00
|
|
|
#[derive(Debug, Clone, PartialEq, Eq)]
|
2019-07-26 07:36:25 +00:00
|
|
|
pub struct BlockFilter {
|
|
|
|
/// Golomb encoded filter
|
2019-08-09 14:58:02 +00:00
|
|
|
pub content: Vec<u8>
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
|
2020-08-07 12:23:35 +00:00
|
|
|
impl FilterHash {
|
|
|
|
/// compute the filter header from a filter hash and previous filter header
|
|
|
|
pub fn filter_header(&self, previous_filter_header: &FilterHeader) -> FilterHeader {
|
|
|
|
let mut header_data = [0u8; 64];
|
|
|
|
header_data[0..32].copy_from_slice(&self[..]);
|
|
|
|
header_data[32..64].copy_from_slice(&previous_filter_header[..]);
|
|
|
|
FilterHeader::hash(&header_data)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-07-26 07:36:25 +00:00
|
|
|
impl BlockFilter {
|
2022-08-09 04:26:38 +00:00
|
|
|
/// Creates a new filter from pre-computed data.
|
|
|
|
pub fn new (content: &[u8]) -> BlockFilter {
|
|
|
|
BlockFilter { content: content.to_vec() }
|
|
|
|
}
|
|
|
|
|
2022-08-09 05:04:27 +00:00
|
|
|
/// Computes a SCRIPT_FILTER that contains spent and output scripts.
|
|
|
|
pub fn new_script_filter<M>(block: &Block, script_for_coin: M) -> Result<BlockFilter, Error>
|
|
|
|
where
|
|
|
|
M: Fn(&OutPoint) -> Result<Script, Error>
|
|
|
|
{
|
|
|
|
let mut out = Vec::new();
|
|
|
|
let mut writer = BlockFilterWriter::new(&mut out, block);
|
|
|
|
|
|
|
|
writer.add_output_scripts();
|
|
|
|
writer.add_input_scripts(script_for_coin)?;
|
|
|
|
writer.finish()?;
|
|
|
|
|
|
|
|
Ok(BlockFilter { content: out })
|
|
|
|
}
|
|
|
|
|
2022-08-09 05:08:29 +00:00
|
|
|
/// Computes this filter's ID in a chain of filters (see [BIP 157]).
|
|
|
|
///
|
|
|
|
/// [BIP 157]: <https://github.com/bitcoin/bips/blob/master/bip-0157.mediawiki#Filter_Headers>
|
2020-08-07 12:23:35 +00:00
|
|
|
pub fn filter_header(&self, previous_filter_header: &FilterHeader) -> FilterHeader {
|
2019-12-06 09:01:15 +00:00
|
|
|
let filter_hash = FilterHash::hash(self.content.as_slice());
|
2020-08-07 12:23:35 +00:00
|
|
|
filter_hash.filter_header(previous_filter_header)
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/// match any query pattern
|
2022-08-08 06:24:25 +00:00
|
|
|
pub fn match_any<'a, I>(&self, block_hash: &BlockHash, query: I) -> Result<bool, Error>
|
|
|
|
where
|
|
|
|
I: Iterator<Item = &'a [u8]>,
|
|
|
|
{
|
2019-08-09 14:58:02 +00:00
|
|
|
let filter_reader = BlockFilterReader::new(block_hash);
|
2022-08-08 05:30:26 +00:00
|
|
|
filter_reader.match_any(&mut self.content.as_slice(), query)
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/// match all query pattern
|
2022-08-08 06:24:25 +00:00
|
|
|
pub fn match_all<'a, I>(&self, block_hash: &BlockHash, query: I) -> Result<bool, Error>
|
|
|
|
where
|
|
|
|
I: Iterator<Item = &'a [u8]>,
|
|
|
|
{
|
2019-08-09 14:58:02 +00:00
|
|
|
let filter_reader = BlockFilterReader::new(block_hash);
|
2022-08-08 05:30:26 +00:00
|
|
|
filter_reader.match_all(&mut self.content.as_slice(), query)
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Compiles and writes a block filter
|
2022-08-08 06:24:25 +00:00
|
|
|
pub struct BlockFilterWriter<'a, W> {
|
2019-07-26 07:36:25 +00:00
|
|
|
block: &'a Block,
|
2022-08-08 06:24:25 +00:00
|
|
|
writer: GCSFilterWriter<'a, W>,
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
|
2022-08-08 06:24:25 +00:00
|
|
|
impl<'a, W: io::Write> BlockFilterWriter<'a, W> {
|
2019-07-26 07:36:25 +00:00
|
|
|
/// Create a block filter writer
|
2022-08-08 06:24:25 +00:00
|
|
|
pub fn new(writer: &'a mut W, block: &'a Block) -> BlockFilterWriter<'a, W> {
|
2020-01-10 11:34:16 +00:00
|
|
|
let block_hash_as_int = block.block_hash().into_inner();
|
2019-10-17 21:40:45 +00:00
|
|
|
let k0 = endian::slice_to_u64_le(&block_hash_as_int[0..8]);
|
|
|
|
let k1 = endian::slice_to_u64_le(&block_hash_as_int[8..16]);
|
2019-07-26 07:36:25 +00:00
|
|
|
let writer = GCSFilterWriter::new(writer, k0, k1, M, P);
|
|
|
|
BlockFilterWriter { block, writer }
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Add output scripts of the block - excluding OP_RETURN scripts
|
|
|
|
pub fn add_output_scripts(&mut self) {
|
|
|
|
for transaction in &self.block.txdata {
|
|
|
|
for output in &transaction.output {
|
|
|
|
if !output.script_pubkey.is_op_return() {
|
|
|
|
self.add_element(output.script_pubkey.as_bytes());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Add consumed output scripts of a block to filter
|
|
|
|
pub fn add_input_scripts<M>(&mut self, script_for_coin: M) -> Result<(), Error>
|
|
|
|
where M: Fn(&OutPoint) -> Result<Script, Error> {
|
|
|
|
for script in self.block.txdata.iter()
|
|
|
|
.skip(1) // skip coinbase
|
|
|
|
.flat_map(|t| t.input.iter().map(|i| &i.previous_output))
|
|
|
|
.map(script_for_coin) {
|
|
|
|
match script {
|
|
|
|
Ok(script) => self.add_element(script.as_bytes()),
|
|
|
|
Err(e) => return Err(e)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Add arbitrary element to a filter
|
|
|
|
pub fn add_element(&mut self, data: &[u8]) {
|
|
|
|
self.writer.add_element(data);
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Write block filter
|
|
|
|
pub fn finish(&mut self) -> Result<usize, io::Error> {
|
|
|
|
self.writer.finish()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Reads and interpret a block filter
|
|
|
|
pub struct BlockFilterReader {
|
|
|
|
reader: GCSFilterReader
|
|
|
|
}
|
|
|
|
|
|
|
|
impl BlockFilterReader {
|
|
|
|
/// Create a block filter reader
|
2019-11-30 16:26:52 +00:00
|
|
|
pub fn new(block_hash: &BlockHash) -> BlockFilterReader {
|
2019-07-26 07:36:25 +00:00
|
|
|
let block_hash_as_int = block_hash.into_inner();
|
2019-10-17 21:40:45 +00:00
|
|
|
let k0 = endian::slice_to_u64_le(&block_hash_as_int[0..8]);
|
|
|
|
let k1 = endian::slice_to_u64_le(&block_hash_as_int[8..16]);
|
2019-07-26 07:36:25 +00:00
|
|
|
BlockFilterReader { reader: GCSFilterReader::new(k0, k1, M, P) }
|
|
|
|
}
|
|
|
|
|
|
|
|
/// match any query pattern
|
2022-08-08 06:24:25 +00:00
|
|
|
pub fn match_any<'a, I, R>(&self, reader: &mut R, query: I) -> Result<bool, Error>
|
|
|
|
where
|
|
|
|
I: Iterator<Item = &'a [u8]>,
|
|
|
|
R: io::Read + ?Sized,
|
|
|
|
{
|
2019-07-26 07:36:25 +00:00
|
|
|
self.reader.match_any(reader, query)
|
|
|
|
}
|
|
|
|
|
|
|
|
/// match all query pattern
|
2022-08-08 06:24:25 +00:00
|
|
|
pub fn match_all<'a, I, R>(&self, reader: &mut R, query: I) -> Result<bool, Error>
|
|
|
|
where
|
|
|
|
I: Iterator<Item = &'a [u8]>,
|
|
|
|
R: io::Read + ?Sized,
|
|
|
|
{
|
2019-07-26 07:36:25 +00:00
|
|
|
self.reader.match_all(reader, query)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Golomb-Rice encoded filter reader
|
|
|
|
pub struct GCSFilterReader {
|
|
|
|
filter: GCSFilter,
|
|
|
|
m: u64
|
|
|
|
}
|
|
|
|
|
|
|
|
impl GCSFilterReader {
|
|
|
|
/// Create a new filter reader with specific seed to siphash
|
|
|
|
pub fn new(k0: u64, k1: u64, m: u64, p: u8) -> GCSFilterReader {
|
|
|
|
GCSFilterReader { filter: GCSFilter::new(k0, k1, p), m }
|
|
|
|
}
|
|
|
|
|
|
|
|
/// match any query pattern
|
2022-08-08 06:24:25 +00:00
|
|
|
pub fn match_any<'a, I, R>(&self, reader: &mut R, query: I) -> Result<bool, Error>
|
|
|
|
where
|
|
|
|
I: Iterator<Item = &'a [u8]>,
|
|
|
|
R: io::Read + ?Sized,
|
|
|
|
{
|
2019-07-26 07:36:25 +00:00
|
|
|
let mut decoder = reader;
|
|
|
|
let n_elements: VarInt = Decodable::consensus_decode(&mut decoder).unwrap_or(VarInt(0));
|
2019-08-05 18:52:34 +00:00
|
|
|
let reader = &mut decoder;
|
2019-07-26 07:36:25 +00:00
|
|
|
// map hashes to [0, n_elements << grp]
|
|
|
|
let nm = n_elements.0 * self.m;
|
|
|
|
let mut mapped = query.map(|e| map_to_range(self.filter.hash(e), nm)).collect::<Vec<_>>();
|
|
|
|
// sort
|
2021-11-03 09:20:34 +00:00
|
|
|
mapped.sort_unstable();
|
2019-07-26 07:36:25 +00:00
|
|
|
if mapped.is_empty() {
|
|
|
|
return Ok(true);
|
|
|
|
}
|
|
|
|
if n_elements.0 == 0 {
|
|
|
|
return Ok(false);
|
|
|
|
}
|
|
|
|
|
|
|
|
// find first match in two sorted arrays in one read pass
|
|
|
|
let mut reader = BitStreamReader::new(reader);
|
|
|
|
let mut data = self.filter.golomb_rice_decode(&mut reader)?;
|
|
|
|
let mut remaining = n_elements.0 - 1;
|
|
|
|
for p in mapped {
|
|
|
|
loop {
|
2019-08-05 19:41:07 +00:00
|
|
|
match data.cmp(&p) {
|
|
|
|
Ordering::Equal => return Ok(true),
|
|
|
|
Ordering::Less => {
|
|
|
|
if remaining > 0 {
|
|
|
|
data += self.filter.golomb_rice_decode(&mut reader)?;
|
|
|
|
remaining -= 1;
|
|
|
|
} else {
|
|
|
|
return Ok(false);
|
|
|
|
}
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
2019-08-05 19:41:07 +00:00
|
|
|
Ordering::Greater => break,
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Ok(false)
|
|
|
|
}
|
|
|
|
|
|
|
|
/// match all query pattern
|
2022-08-08 06:24:25 +00:00
|
|
|
pub fn match_all<'a, I, R>(&self, reader: &mut R, query: I) -> Result<bool, Error>
|
|
|
|
where
|
|
|
|
I: Iterator<Item = &'a [u8]>,
|
|
|
|
R: io::Read + ?Sized,
|
|
|
|
{
|
2019-07-26 07:36:25 +00:00
|
|
|
let mut decoder = reader;
|
|
|
|
let n_elements: VarInt = Decodable::consensus_decode(&mut decoder).unwrap_or(VarInt(0));
|
2019-08-05 18:52:34 +00:00
|
|
|
let reader = &mut decoder;
|
2019-07-26 07:36:25 +00:00
|
|
|
// map hashes to [0, n_elements << grp]
|
|
|
|
let nm = n_elements.0 * self.m;
|
|
|
|
let mut mapped = query.map(|e| map_to_range(self.filter.hash(e), nm)).collect::<Vec<_>>();
|
|
|
|
// sort
|
2021-11-03 09:20:34 +00:00
|
|
|
mapped.sort_unstable();
|
2019-07-26 07:36:25 +00:00
|
|
|
mapped.dedup();
|
|
|
|
if mapped.is_empty() {
|
|
|
|
return Ok(true);
|
|
|
|
}
|
|
|
|
if n_elements.0 == 0 {
|
|
|
|
return Ok(false);
|
|
|
|
}
|
|
|
|
|
|
|
|
// figure if all mapped are there in one read pass
|
|
|
|
let mut reader = BitStreamReader::new(reader);
|
|
|
|
let mut data = self.filter.golomb_rice_decode(&mut reader)?;
|
|
|
|
let mut remaining = n_elements.0 - 1;
|
|
|
|
for p in mapped {
|
|
|
|
loop {
|
2019-08-05 19:41:07 +00:00
|
|
|
match data.cmp(&p) {
|
|
|
|
Ordering::Equal => break,
|
|
|
|
Ordering::Less => {
|
|
|
|
if remaining > 0 {
|
|
|
|
data += self.filter.golomb_rice_decode(&mut reader)?;
|
|
|
|
remaining -= 1;
|
|
|
|
} else {
|
|
|
|
return Ok(false);
|
|
|
|
}
|
|
|
|
},
|
|
|
|
Ordering::Greater => return Ok(false),
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Ok(true)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// fast reduction of hash to [0, nm) range
|
|
|
|
fn map_to_range(hash: u64, nm: u64) -> u64 {
|
2020-10-05 07:21:40 +00:00
|
|
|
((hash as u128 * nm as u128) >> 64) as u64
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/// Colomb-Rice encoded filter writer
|
2022-08-08 06:24:25 +00:00
|
|
|
pub struct GCSFilterWriter<'a, W> {
|
2019-07-26 07:36:25 +00:00
|
|
|
filter: GCSFilter,
|
2022-08-08 06:24:25 +00:00
|
|
|
writer: &'a mut W,
|
2019-07-26 07:36:25 +00:00
|
|
|
elements: HashSet<Vec<u8>>,
|
|
|
|
m: u64
|
|
|
|
}
|
|
|
|
|
2022-08-08 06:24:25 +00:00
|
|
|
impl<'a, W: io::Write> GCSFilterWriter<'a, W> {
|
2019-07-26 07:36:25 +00:00
|
|
|
/// Create a new GCS writer wrapping a generic writer, with specific seed to siphash
|
2022-08-08 06:24:25 +00:00
|
|
|
pub fn new(writer: &'a mut W, k0: u64, k1: u64, m: u64, p: u8) -> GCSFilterWriter<'a, W> {
|
2019-07-26 07:36:25 +00:00
|
|
|
GCSFilterWriter {
|
|
|
|
filter: GCSFilter::new(k0, k1, p),
|
|
|
|
writer,
|
|
|
|
elements: HashSet::new(),
|
|
|
|
m
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Add some data to the filter
|
|
|
|
pub fn add_element(&mut self, element: &[u8]) {
|
|
|
|
if !element.is_empty() {
|
|
|
|
self.elements.insert(element.to_vec());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// write the filter to the wrapped writer
|
|
|
|
pub fn finish(&mut self) -> Result<usize, io::Error> {
|
|
|
|
let nm = self.elements.len() as u64 * self.m;
|
|
|
|
|
|
|
|
// map hashes to [0, n_elements * M)
|
|
|
|
let mut mapped: Vec<_> = self.elements.iter()
|
|
|
|
.map(|e| map_to_range(self.filter.hash(e.as_slice()), nm)).collect();
|
2021-11-03 09:20:34 +00:00
|
|
|
mapped.sort_unstable();
|
2019-07-26 07:36:25 +00:00
|
|
|
|
|
|
|
// write number of elements as varint
|
2022-07-28 21:02:06 +00:00
|
|
|
let mut wrote = VarInt(mapped.len() as u64).consensus_encode(&mut self.writer)?;
|
2019-07-26 07:36:25 +00:00
|
|
|
|
|
|
|
// write out deltas of sorted values into a Golonb-Rice coded bit stream
|
|
|
|
let mut writer = BitStreamWriter::new(self.writer);
|
|
|
|
let mut last = 0;
|
|
|
|
for data in mapped {
|
|
|
|
wrote += self.filter.golomb_rice_encode(&mut writer, data - last)?;
|
|
|
|
last = data;
|
|
|
|
}
|
|
|
|
wrote += writer.flush()?;
|
|
|
|
Ok(wrote)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Golomb Coded Set Filter
|
|
|
|
struct GCSFilter {
|
|
|
|
k0: u64, // sip hash key
|
|
|
|
k1: u64, // sip hash key
|
|
|
|
p: u8
|
|
|
|
}
|
|
|
|
|
|
|
|
impl GCSFilter {
|
|
|
|
/// Create a new filter
|
|
|
|
fn new(k0: u64, k1: u64, p: u8) -> GCSFilter {
|
|
|
|
GCSFilter { k0, k1, p }
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Golomb-Rice encode a number n to a bit stream (Parameter 2^k)
|
2022-08-08 06:24:25 +00:00
|
|
|
fn golomb_rice_encode<'a, W>(&self, writer: &mut BitStreamWriter<'a, W>, n: u64) -> Result<usize, io::Error>
|
|
|
|
where
|
|
|
|
W: io::Write,
|
|
|
|
{
|
2019-07-26 07:36:25 +00:00
|
|
|
let mut wrote = 0;
|
|
|
|
let mut q = n >> self.p;
|
|
|
|
while q > 0 {
|
|
|
|
let nbits = cmp::min(q, 64);
|
|
|
|
wrote += writer.write(!0u64, nbits as u8)?;
|
|
|
|
q -= nbits;
|
|
|
|
}
|
|
|
|
wrote += writer.write(0, 1)?;
|
|
|
|
wrote += writer.write(n, self.p)?;
|
|
|
|
Ok(wrote)
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Golomb-Rice decode a number from a bit stream (Parameter 2^k)
|
2022-08-08 06:24:25 +00:00
|
|
|
fn golomb_rice_decode<R>(&self, reader: &mut BitStreamReader<R>) -> Result<u64, io::Error>
|
|
|
|
where
|
|
|
|
R: io::Read
|
|
|
|
{
|
2019-07-26 07:36:25 +00:00
|
|
|
let mut q = 0u64;
|
|
|
|
while reader.read(1)? == 1 {
|
|
|
|
q += 1;
|
|
|
|
}
|
|
|
|
let r = reader.read(self.p)?;
|
2019-08-05 19:41:07 +00:00
|
|
|
Ok((q << self.p) + r)
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
|
2019-08-04 19:27:36 +00:00
|
|
|
/// Hash an arbitrary slice with siphash using parameters of this filter
|
2019-07-26 07:36:25 +00:00
|
|
|
fn hash(&self, element: &[u8]) -> u64 {
|
|
|
|
siphash24::Hash::hash_to_u64_with_keys(self.k0, self.k1, element)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Bitwise stream reader
|
2022-08-08 06:24:25 +00:00
|
|
|
pub struct BitStreamReader<'a, R> {
|
2019-07-26 07:36:25 +00:00
|
|
|
buffer: [u8; 1],
|
|
|
|
offset: u8,
|
2022-08-08 06:24:25 +00:00
|
|
|
reader: &'a mut R,
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
|
2022-08-08 06:24:25 +00:00
|
|
|
impl<'a, R: io::Read> BitStreamReader<'a, R> {
|
2019-07-26 07:36:25 +00:00
|
|
|
/// Create a new BitStreamReader that reads bitwise from a given reader
|
2022-08-08 06:24:25 +00:00
|
|
|
pub fn new(reader: &'a mut R) -> BitStreamReader<'a, R> {
|
2019-07-26 07:36:25 +00:00
|
|
|
BitStreamReader {
|
|
|
|
buffer: [0u8],
|
2021-11-03 09:20:34 +00:00
|
|
|
reader,
|
2019-07-26 07:36:25 +00:00
|
|
|
offset: 8,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Read nbit bits
|
|
|
|
pub fn read(&mut self, mut nbits: u8) -> Result<u64, io::Error> {
|
|
|
|
if nbits > 64 {
|
|
|
|
return Err(io::Error::new(io::ErrorKind::Other, "can not read more than 64 bits at once"));
|
|
|
|
}
|
|
|
|
let mut data = 0u64;
|
|
|
|
while nbits > 0 {
|
|
|
|
if self.offset == 8 {
|
|
|
|
self.reader.read_exact(&mut self.buffer)?;
|
|
|
|
self.offset = 0;
|
|
|
|
}
|
|
|
|
let bits = cmp::min(8 - self.offset, nbits);
|
|
|
|
data <<= bits;
|
|
|
|
data |= ((self.buffer[0] << self.offset) >> (8 - bits)) as u64;
|
|
|
|
self.offset += bits;
|
|
|
|
nbits -= bits;
|
|
|
|
}
|
|
|
|
Ok(data)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Bitwise stream writer
|
2022-08-08 06:24:25 +00:00
|
|
|
pub struct BitStreamWriter<'a, W> {
|
2019-07-26 07:36:25 +00:00
|
|
|
buffer: [u8; 1],
|
|
|
|
offset: u8,
|
2022-08-08 06:24:25 +00:00
|
|
|
writer: &'a mut W,
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
|
2022-08-08 06:24:25 +00:00
|
|
|
impl<'a, W: io::Write> BitStreamWriter<'a, W> {
|
2019-07-26 07:36:25 +00:00
|
|
|
/// Create a new BitStreamWriter that writes bitwise to a given writer
|
2022-08-08 06:24:25 +00:00
|
|
|
pub fn new(writer: &'a mut W) -> BitStreamWriter<'a, W> {
|
2019-07-26 07:36:25 +00:00
|
|
|
BitStreamWriter {
|
|
|
|
buffer: [0u8],
|
2021-11-03 09:20:34 +00:00
|
|
|
writer,
|
2019-07-26 07:36:25 +00:00
|
|
|
offset: 0,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Write nbits bits from data
|
|
|
|
pub fn write(&mut self, data: u64, mut nbits: u8) -> Result<usize, io::Error> {
|
|
|
|
if nbits > 64 {
|
|
|
|
return Err(io::Error::new(io::ErrorKind::Other, "can not write more than 64 bits at once"));
|
|
|
|
}
|
|
|
|
let mut wrote = 0;
|
|
|
|
while nbits > 0 {
|
|
|
|
let bits = cmp::min(8 - self.offset, nbits);
|
|
|
|
self.buffer[0] |= ((data << (64 - nbits)) >> (64 - 8 + self.offset)) as u8;
|
|
|
|
self.offset += bits;
|
|
|
|
nbits -= bits;
|
|
|
|
if self.offset == 8 {
|
|
|
|
wrote += self.flush()?;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Ok(wrote)
|
|
|
|
}
|
|
|
|
|
|
|
|
/// flush bits not yet written
|
|
|
|
pub fn flush(&mut self) -> Result<usize, io::Error> {
|
|
|
|
if self.offset > 0 {
|
|
|
|
self.writer.write_all(&self.buffer)?;
|
|
|
|
self.buffer[0] = 0u8;
|
|
|
|
self.offset = 0;
|
|
|
|
Ok(1)
|
|
|
|
} else {
|
|
|
|
Ok(0)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
#[cfg(test)]
|
|
|
|
mod test {
|
2022-05-02 22:13:57 +00:00
|
|
|
use crate::hash_types::BlockHash;
|
|
|
|
use crate::hashes::hex::FromHex;
|
2019-07-26 07:36:25 +00:00
|
|
|
|
|
|
|
use super::*;
|
|
|
|
|
|
|
|
extern crate serde_json;
|
2022-01-24 01:40:10 +00:00
|
|
|
use self::serde_json::Value;
|
2019-07-26 07:36:25 +00:00
|
|
|
|
2022-05-02 22:13:57 +00:00
|
|
|
use crate::consensus::encode::deserialize;
|
2021-06-09 10:34:44 +00:00
|
|
|
use std::collections::HashMap;
|
2019-07-26 07:36:25 +00:00
|
|
|
|
|
|
|
#[test]
|
|
|
|
fn test_blockfilters() {
|
|
|
|
|
|
|
|
// test vectors from: https://github.com/jimpo/bitcoin/blob/c7efb652f3543b001b4dd22186a354605b14f47e/src/test/data/blockfilters.json
|
2021-12-31 10:19:35 +00:00
|
|
|
let data = include_str!("../../test_data/blockfilters.json");
|
2019-07-26 07:36:25 +00:00
|
|
|
|
|
|
|
let testdata = serde_json::from_str::<Value>(data).unwrap().as_array().unwrap().clone();
|
|
|
|
for t in testdata.iter().skip(1) {
|
2022-06-07 05:07:59 +00:00
|
|
|
let block_hash = BlockHash::from_hex(t.get(1).unwrap().as_str().unwrap()).unwrap();
|
|
|
|
let block: Block = deserialize(&Vec::from_hex(t.get(2).unwrap().as_str().unwrap()).unwrap()).unwrap();
|
2020-01-10 11:34:16 +00:00
|
|
|
assert_eq!(block.block_hash(), block_hash);
|
2019-07-26 07:36:25 +00:00
|
|
|
let scripts = t.get(3).unwrap().as_array().unwrap();
|
2022-06-07 05:07:59 +00:00
|
|
|
let previous_filter_header = FilterHeader::from_hex(t.get(4).unwrap().as_str().unwrap()).unwrap();
|
|
|
|
let filter_content = Vec::from_hex(t.get(5).unwrap().as_str().unwrap()).unwrap();
|
|
|
|
let filter_header = FilterHeader::from_hex(t.get(6).unwrap().as_str().unwrap()).unwrap();
|
2019-07-26 07:36:25 +00:00
|
|
|
|
|
|
|
let mut txmap = HashMap::new();
|
|
|
|
let mut si = scripts.iter();
|
|
|
|
for tx in block.txdata.iter().skip(1) {
|
|
|
|
for input in tx.input.iter() {
|
2022-06-07 05:09:58 +00:00
|
|
|
txmap.insert(input.previous_output, Script::from(Vec::from_hex(si.next().unwrap().as_str().unwrap()).unwrap()));
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
let filter = BlockFilter::new_script_filter(&block,
|
|
|
|
|o| if let Some(s) = txmap.get(o) {
|
|
|
|
Ok(s.clone())
|
|
|
|
} else {
|
2022-06-07 05:09:58 +00:00
|
|
|
Err(Error::UtxoMissing(*o))
|
2019-07-26 07:36:25 +00:00
|
|
|
}).unwrap();
|
|
|
|
|
2019-08-09 14:58:02 +00:00
|
|
|
let test_filter = BlockFilter::new(filter_content.as_slice());
|
2019-07-26 07:36:25 +00:00
|
|
|
|
|
|
|
assert_eq!(test_filter.content, filter.content);
|
|
|
|
|
2020-01-10 11:34:16 +00:00
|
|
|
let block_hash = &block.block_hash();
|
2019-11-30 16:26:52 +00:00
|
|
|
assert!(filter.match_all(block_hash, &mut txmap.iter()
|
2019-07-26 07:36:25 +00:00
|
|
|
.filter_map(|(_, s)| if !s.is_empty() { Some(s.as_bytes()) } else { None })).unwrap());
|
|
|
|
|
2022-06-07 05:21:29 +00:00
|
|
|
for script in txmap.values() {
|
2019-07-26 07:36:25 +00:00
|
|
|
let query = vec![script];
|
|
|
|
if !script.is_empty () {
|
2022-06-07 05:07:59 +00:00
|
|
|
assert!(filter.match_any(block_hash, &mut query.iter()
|
2019-07-26 07:36:25 +00:00
|
|
|
.map(|s| s.as_bytes())).unwrap());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-08-07 12:23:35 +00:00
|
|
|
assert_eq!(filter_header, filter.filter_header(&previous_filter_header));
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
#[test]
|
2022-01-24 00:26:29 +00:00
|
|
|
fn test_filter() {
|
2019-07-26 07:36:25 +00:00
|
|
|
let mut patterns = HashSet::new();
|
|
|
|
|
2020-09-14 14:39:11 +00:00
|
|
|
patterns.insert(Vec::from_hex("000000").unwrap());
|
|
|
|
patterns.insert(Vec::from_hex("111111").unwrap());
|
|
|
|
patterns.insert(Vec::from_hex("222222").unwrap());
|
|
|
|
patterns.insert(Vec::from_hex("333333").unwrap());
|
|
|
|
patterns.insert(Vec::from_hex("444444").unwrap());
|
|
|
|
patterns.insert(Vec::from_hex("555555").unwrap());
|
|
|
|
patterns.insert(Vec::from_hex("666666").unwrap());
|
|
|
|
patterns.insert(Vec::from_hex("777777").unwrap());
|
|
|
|
patterns.insert(Vec::from_hex("888888").unwrap());
|
|
|
|
patterns.insert(Vec::from_hex("999999").unwrap());
|
|
|
|
patterns.insert(Vec::from_hex("aaaaaa").unwrap());
|
|
|
|
patterns.insert(Vec::from_hex("bbbbbb").unwrap());
|
|
|
|
patterns.insert(Vec::from_hex("cccccc").unwrap());
|
|
|
|
patterns.insert(Vec::from_hex("dddddd").unwrap());
|
|
|
|
patterns.insert(Vec::from_hex("eeeeee").unwrap());
|
|
|
|
patterns.insert(Vec::from_hex("ffffff").unwrap());
|
2019-07-26 07:36:25 +00:00
|
|
|
|
2021-06-09 10:34:44 +00:00
|
|
|
let mut out = Vec::new();
|
2019-07-26 07:36:25 +00:00
|
|
|
{
|
|
|
|
let mut writer = GCSFilterWriter::new(&mut out, 0, 0, M, P);
|
|
|
|
for p in &patterns {
|
|
|
|
writer.add_element(p.as_slice());
|
|
|
|
}
|
|
|
|
writer.finish().unwrap();
|
|
|
|
}
|
|
|
|
|
2021-06-09 10:34:44 +00:00
|
|
|
let bytes = out;
|
2019-07-26 07:36:25 +00:00
|
|
|
|
|
|
|
{
|
2022-06-07 05:23:35 +00:00
|
|
|
let query = vec![Vec::from_hex("abcdef").unwrap(), Vec::from_hex("eeeeee").unwrap()];
|
2019-07-26 07:36:25 +00:00
|
|
|
let reader = GCSFilterReader::new(0, 0, M, P);
|
2022-08-08 05:30:26 +00:00
|
|
|
assert!(reader.match_any(&mut bytes.as_slice(), &mut query.iter().map(|v| v.as_slice())).unwrap());
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
{
|
2022-06-07 05:23:35 +00:00
|
|
|
let query = vec![Vec::from_hex("abcdef").unwrap(), Vec::from_hex("123456").unwrap()];
|
2019-07-26 07:36:25 +00:00
|
|
|
let reader = GCSFilterReader::new(0, 0, M, P);
|
2022-08-08 05:30:26 +00:00
|
|
|
assert!(!reader.match_any(&mut bytes.as_slice(), &mut query.iter().map(|v| v.as_slice())).unwrap());
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
{
|
|
|
|
let reader = GCSFilterReader::new(0, 0, M, P);
|
|
|
|
let mut query = Vec::new();
|
|
|
|
for p in &patterns {
|
|
|
|
query.push(p.clone());
|
|
|
|
}
|
2022-08-08 05:30:26 +00:00
|
|
|
assert!(reader.match_all(&mut bytes.as_slice(), &mut query.iter().map(|v| v.as_slice())).unwrap());
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
{
|
|
|
|
let reader = GCSFilterReader::new(0, 0, M, P);
|
|
|
|
let mut query = Vec::new();
|
|
|
|
for p in &patterns {
|
|
|
|
query.push(p.clone());
|
|
|
|
}
|
2020-09-14 14:39:11 +00:00
|
|
|
query.push(Vec::from_hex("abcdef").unwrap());
|
2022-08-08 05:30:26 +00:00
|
|
|
assert!(!reader.match_all(&mut bytes.as_slice(), &mut query.iter().map(|v| v.as_slice())).unwrap());
|
2019-07-26 07:36:25 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
fn test_bit_stream() {
|
2021-06-09 10:34:44 +00:00
|
|
|
let mut out = Vec::new();
|
2019-07-26 07:36:25 +00:00
|
|
|
{
|
|
|
|
let mut writer = BitStreamWriter::new(&mut out);
|
|
|
|
writer.write(0, 1).unwrap(); // 0
|
|
|
|
writer.write(2, 2).unwrap(); // 10
|
|
|
|
writer.write(6, 3).unwrap(); // 110
|
|
|
|
writer.write(11, 4).unwrap(); // 1011
|
|
|
|
writer.write(1, 5).unwrap(); // 00001
|
|
|
|
writer.write(32, 6).unwrap(); // 100000
|
|
|
|
writer.write(7, 7).unwrap(); // 0000111
|
|
|
|
writer.flush().unwrap();
|
|
|
|
}
|
2021-06-09 10:34:44 +00:00
|
|
|
let bytes = out;
|
2019-07-26 07:36:25 +00:00
|
|
|
assert_eq!("01011010110000110000000001110000", format!("{:08b}{:08b}{:08b}{:08b}", bytes[0], bytes[1], bytes[2], bytes[3]));
|
|
|
|
{
|
2022-08-08 05:30:26 +00:00
|
|
|
let mut input = bytes.as_slice();
|
2019-07-26 07:36:25 +00:00
|
|
|
let mut reader = BitStreamReader::new(&mut input);
|
|
|
|
assert_eq!(reader.read(1).unwrap(), 0);
|
|
|
|
assert_eq!(reader.read(2).unwrap(), 2);
|
|
|
|
assert_eq!(reader.read(3).unwrap(), 6);
|
|
|
|
assert_eq!(reader.read(4).unwrap(), 11);
|
|
|
|
assert_eq!(reader.read(5).unwrap(), 1);
|
|
|
|
assert_eq!(reader.read(6).unwrap(), 32);
|
|
|
|
assert_eq!(reader.read(7).unwrap(), 7);
|
|
|
|
// 4 bits remained
|
|
|
|
assert!(reader.read(5).is_err());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|