fix major bug: re-used blobs need to have their flags cleared

plus: lots of additional debug-ability
This commit is contained in:
Rob Walker
2018-07-23 18:55:58 -07:00
parent 54f2146429
commit f11e60b801
4 changed files with 486 additions and 262 deletions

View File

@ -506,19 +506,6 @@ impl Crdt {
} }
} }
/// Stamp every blob in `blobs` with the sender id `me.id` and a consecutive index.
///
/// The blob at position `i` receives index `*receive_index + i`. `receive_index` is
/// only read here; it is not advanced. Always returns `Ok(())`; a poisoned blob lock
/// or a failing `set_id`/`set_index` panics via `expect`.
pub fn index_blobs(me: &NodeInfo, blobs: &[SharedBlob], receive_index: &mut u64) -> Result<()> {
    trace!("{:x}: INDEX_BLOBS {}", me.debug_id(), blobs.len());
    // position in the slice, offset by the starting index, is the blob index
    let first_index = *receive_index;
    for (offset, shared) in blobs.iter().enumerate() {
        // only leader should be broadcasting
        let mut blob_w = shared
            .write()
            .expect("'blob' write lock in crdt::index_blobs");
        blob_w.set_id(me.id).expect("set_id in pub fn broadcast");
        blob_w
            .set_index(first_index + offset as u64)
            .expect("set_index in pub fn broadcast");
    }
    Ok(())
}
/// compute broadcast table /// compute broadcast table
/// # Remarks /// # Remarks
pub fn compute_broadcast_table(&self) -> Vec<NodeInfo> { pub fn compute_broadcast_table(&self) -> Vec<NodeInfo> {

View File

@ -1,6 +1,7 @@
// Support erasure coding // Support erasure coding
use packet::{BlobRecycler, SharedBlob, BLOB_HEADER_SIZE}; use packet::{BlobRecycler, SharedBlob, BLOB_HEADER_SIZE, BLOB_SIZE};
use std::cmp; use std::cmp;
use std::mem;
use std::result; use std::result;
use streamer::WindowSlot; use streamer::WindowSlot;
@ -179,7 +180,33 @@ pub fn decode_blocks(
// +---+ +---+ +---+ +---+ +---+ . . . +---+ +---+ +---+ +---+ +---+ // +---+ +---+ +---+ +---+ +---+ . . . +---+ +---+ +---+ +---+ +---+
// | | | | | | | | | | | | | C | | C | | C | | C | // | | | | | | | | | | | | | C | | C | | C | | C |
// +---+ +---+ +---+ +---+ +---+ +---+ +---+ +---+ +---+ +---+ // +---+ +---+ +---+ +---+ +---+ +---+ +---+ +---+ +---+ +---+
//
// blob structure for coding, recover
//
// + ------- meta is set and used by transport, meta.size is actual length
// | of data in the byte array blob.data
// |
// | + -- data is stuff shipped over the wire, and has an included
// | | header
// V V
// +----------+------------------------------------------------------------+
// | meta | data |
// |+---+-- |+---+---+---+---+------------------------------------------+|
// || s | . || i | | f | s | ||
// || i | . || n | i | l | i | ||
// || z | . || d | d | a | z | blob.data(), or blob.data_mut() ||
// || e | || e | | g | e | ||
// |+---+-- || x | | s | | ||
// | |+---+---+---+---+------------------------------------------+|
// +----------+------------------------------------------------------------+
// | |<=== coding blob part for "coding" =======>|
// | |
// |<============== data blob part for "coding" ==============>|
//
//
//
pub fn generate_coding( pub fn generate_coding(
debug_id: u64,
window: &mut [WindowSlot], window: &mut [WindowSlot],
recycler: &BlobRecycler, recycler: &BlobRecycler,
start_idx: usize, start_idx: usize,
@ -188,41 +215,39 @@ pub fn generate_coding(
let mut block_start = start_idx - (start_idx % NUM_DATA); let mut block_start = start_idx - (start_idx % NUM_DATA);
loop { loop {
if (block_start + NUM_DATA) > (start_idx + num_blobs) { let block_end = block_start + NUM_DATA;
if block_end > (start_idx + num_blobs) {
break; break;
} }
info!( info!(
"generate_coding start: {} end: {} start_idx: {} num_blobs: {}", "generate_coding {:x} start: {} end: {} start_idx: {} num_blobs: {}",
block_start, debug_id, block_start, block_end, start_idx, num_blobs
block_start + NUM_DATA,
start_idx,
num_blobs
); );
let mut data_blobs = Vec::with_capacity(NUM_DATA);
let mut max_data_size = 0; let mut max_data_size = 0;
// find max_data_size, maybe bail if not all the data is here // find max_data_size, maybe bail if not all the data is here
for i in block_start..block_start + NUM_DATA { for i in block_start..block_end {
let n = i % window.len(); let n = i % window.len();
trace!("window[{}] = {:?}", n, window[n].data); trace!("{:x} window[{}] = {:?}", debug_id, n, window[n].data);
if let Some(b) = &window[n].data { if let Some(b) = &window[n].data {
max_data_size = cmp::max(b.read().unwrap().meta.size, max_data_size); max_data_size = cmp::max(b.read().unwrap().meta.size, max_data_size);
} else { } else {
trace!("data block is null @ {}", n); trace!("{:x} data block is null @ {}", debug_id, n);
return Ok(()); return Ok(());
} }
} }
trace!("max_data_size: {}", max_data_size); trace!("{:x} max_data_size: {}", debug_id, max_data_size);
// make sure extra bytes in each blob are zero-d out for generation of let mut data_blobs = Vec::with_capacity(NUM_DATA);
// coding blobs for i in block_start..block_end {
for i in block_start..block_start + NUM_DATA {
let n = i % window.len(); let n = i % window.len();
if let Some(b) = &window[n].data { if let Some(b) = &window[n].data {
// make sure extra bytes in each blob are zero-d out for generation of
// coding blobs
let mut b_wl = b.write().unwrap(); let mut b_wl = b.write().unwrap();
for i in b_wl.meta.size..max_data_size { for i in b_wl.meta.size..max_data_size {
b_wl.data[i] = 0; b_wl.data[i] = 0;
@ -233,38 +258,43 @@ pub fn generate_coding(
let mut coding_blobs = Vec::with_capacity(NUM_CODING); let mut coding_blobs = Vec::with_capacity(NUM_CODING);
let coding_start = block_start + NUM_DATA - NUM_CODING; let coding_start = block_end - NUM_CODING;
let coding_end = block_start + NUM_DATA;
for i in coding_start..coding_end { for i in coding_start..block_end {
let n = i % window.len(); let n = i % window.len();
if window[n].coding.is_none() { assert!(window[n].coding.is_none());
window[n].coding = Some(recycler.allocate()); window[n].coding = Some(recycler.allocate());
}
let coding = window[n].coding.clone().unwrap(); let coding = window[n].coding.clone().unwrap();
let mut coding_wl = coding.write().unwrap(); let mut coding_wl = coding.write().unwrap();
{ for i in 0..max_data_size {
coding_wl.data[i] = 0;
}
// copy index and id from the data blob // copy index and id from the data blob
let data = window[n].data.clone().unwrap(); if let Some(data) = &window[n].data {
let data_rl = data.read().unwrap(); let data_rl = data.read().unwrap();
coding_wl.set_index(data_rl.get_index().unwrap()).unwrap();
coding_wl.set_id(data_rl.get_id().unwrap()).unwrap(); let index = data_rl.get_index().unwrap();
let id = data_rl.get_id().unwrap();
trace!(
"{:x} copying index {} id {:?} from data to coding",
debug_id,
index,
id
);
coding_wl.set_index(index).unwrap();
coding_wl.set_id(id).unwrap();
} }
coding_wl.set_size(max_data_size); coding_wl.set_size(max_data_size);
if coding_wl.set_coding().is_err() { if coding_wl.set_coding().is_err() {
return Err(ErasureError::EncodeError); return Err(ErasureError::EncodeError);
} }
coding_blobs.push( coding_blobs.push(coding.clone());
window[n]
.coding
.clone()
.expect("'coding_blobs' arr in pub fn generate_coding"),
);
} }
trace!("max_data_size {}", max_data_size);
let mut data_locks = Vec::with_capacity(NUM_DATA); let mut data_locks = Vec::with_capacity(NUM_DATA);
for b in &data_blobs { for b in &data_blobs {
data_locks.push( data_locks.push(
@ -275,7 +305,7 @@ pub fn generate_coding(
let mut data_ptrs: Vec<&[u8]> = Vec::with_capacity(NUM_DATA); let mut data_ptrs: Vec<&[u8]> = Vec::with_capacity(NUM_DATA);
for (i, l) in data_locks.iter_mut().enumerate() { for (i, l) in data_locks.iter_mut().enumerate() {
trace!("i: {} data: {}", i, l.data[0]); trace!("{:x} i: {} data: {}", debug_id, i, l.data[0]);
data_ptrs.push(&l.data[..max_data_size]); data_ptrs.push(&l.data[..max_data_size]);
} }
@ -289,36 +319,110 @@ pub fn generate_coding(
let mut coding_ptrs: Vec<&mut [u8]> = Vec::with_capacity(NUM_CODING); let mut coding_ptrs: Vec<&mut [u8]> = Vec::with_capacity(NUM_CODING);
for (i, l) in coding_locks.iter_mut().enumerate() { for (i, l) in coding_locks.iter_mut().enumerate() {
trace!("i: {} coding: {} size: {}", i, l.data[0], max_data_size); trace!(
"{:x} i: {} coding: {} size: {}",
debug_id,
i,
l.data[0],
max_data_size
);
coding_ptrs.push(&mut l.data_mut()[..max_data_size]); coding_ptrs.push(&mut l.data_mut()[..max_data_size]);
} }
generate_coding_blocks(coding_ptrs.as_mut_slice(), &data_ptrs)?; generate_coding_blocks(coding_ptrs.as_mut_slice(), &data_ptrs)?;
debug!( debug!(
"start_idx: {} data: {}:{} coding: {}:{}", "{:x} start_idx: {} data: {}:{} coding: {}:{}",
start_idx, debug_id, start_idx, block_start, block_end, coding_start, block_end
block_start,
block_start + NUM_DATA,
coding_start,
coding_end
); );
block_start += NUM_DATA; block_start = block_end;
} }
Ok(()) Ok(())
} }
// examine the window beginning at block_start for missing or
// stale (based on block_start_idx) blobs
// if a blob is stale, remove it from the window slot
fn find_missing(
debug_id: u64,
block_start_idx: u64,
block_start: usize,
window: &mut [WindowSlot],
recycler: &BlobRecycler,
) -> (usize, usize) {
let mut data_missing = 0;
let mut coding_missing = 0;
let block_end = block_start + NUM_DATA;
let coding_start = block_start + NUM_DATA - NUM_CODING;
// count missing blobs in the block
for i in block_start..block_end {
let idx = (i - block_start) as u64 + block_start_idx;
let n = i % window.len();
// swap blob out with None, if it's in the right place, put it back
if let Some(blob) = mem::replace(&mut window[n].data, None) {
let blob_idx = blob.read().unwrap().get_index().unwrap();
if blob_idx == idx {
trace!("recover {:x}: idx: {} good data", debug_id, idx);
mem::replace(&mut window[n].data, Some(blob));
} else {
trace!(
"recover {:x}: idx: {} old data {}, recycling",
debug_id,
idx,
blob_idx
);
recycler.recycle(blob);
data_missing += 1;
}
} else {
trace!("recover {:x}: idx: {} None data", debug_id, idx);
data_missing += 1;
}
if i >= coding_start {
// swap blob out with None, if it's in the right place, put it back
if let Some(blob) = mem::replace(&mut window[n].coding, None) {
let blob_idx = blob.read().unwrap().get_index().unwrap();
if blob_idx == idx {
trace!("recover {:x}: idx: {} good coding", debug_id, idx);
mem::replace(&mut window[n].coding, Some(blob));
} else {
trace!(
"recover {:x}: idx: {} old coding {}, recycling",
debug_id,
idx,
blob_idx
);
recycler.recycle(blob);
coding_missing += 1;
}
} else {
trace!("recover {:x}: idx: {} None coding", debug_id, idx);
coding_missing += 1;
}
}
}
(data_missing, coding_missing)
}
// Recover missing blocks into window // Recover missing blocks into window
// missing blocks should be None, will use re // missing blocks should be None or old...
// to allocate new ones. Returns err if not enough // Use recycler to allocate new ones.
// coding blocks are present to restore // If not enough coding or data blocks are present to restore
// any of the blocks, the block is skipped.
// Side effect: old blobs in a block are None'd
pub fn recover( pub fn recover(
debug_id: u64,
recycler: &BlobRecycler, recycler: &BlobRecycler,
window: &mut [WindowSlot], window: &mut [WindowSlot],
start_idx: u64,
start: usize, start: usize,
num_blobs: usize, num_blobs: usize,
) -> Result<()> { ) -> Result<()> {
let num_blocks = (num_blobs / NUM_DATA) + 1; let num_blocks = (num_blobs / NUM_DATA) + 1;
let mut block_start = start - (start % NUM_DATA); let mut block_start = start - (start % NUM_DATA);
let mut block_start_idx = start_idx - (start_idx % NUM_DATA as u64);
debug!( debug!(
"num_blocks: {} start: {} num_blobs: {} block_start: {}", "num_blocks: {} start: {} num_blobs: {} block_start: {}",
@ -326,39 +430,37 @@ pub fn recover(
); );
for _ in 0..num_blocks { for _ in 0..num_blocks {
let mut data_missing = 0;
let mut coding_missing = 0;
let coding_start = block_start + NUM_DATA - NUM_CODING; let coding_start = block_start + NUM_DATA - NUM_CODING;
let coding_end = block_start + NUM_DATA; let block_end = block_start + NUM_DATA;
trace!( trace!(
"recover: block_start: {} coding_start: {} coding_end: {}", "recover {:x}: block_start_idx: {} block_start: {} coding_start: {} block_end: {}",
debug_id,
block_start_idx,
block_start, block_start,
coding_start, coding_start,
coding_end block_end
); );
for i in block_start..coding_end {
let n = i % window.len(); let (data_missing, coding_missing) =
if window[n].coding.is_none() && i >= coding_start { find_missing(debug_id, block_start_idx, block_start, window, recycler);
coding_missing += 1;
}
if window[n].data.is_none() {
data_missing += 1;
}
}
// skip this block if no data is missing, or if too much is missing for the available coding to recover // skip this block if no data is missing, or if too much is missing for the available coding to recover
if data_missing == 0 || (data_missing + coding_missing) > NUM_CODING { if data_missing == 0 || (data_missing + coding_missing) > NUM_CODING {
trace!( trace!(
"1: start: {} skipping recovery data: {} coding: {}", "recover {:x}: start: {} skipping recovery data: {} coding: {}",
debug_id,
block_start, block_start,
data_missing, data_missing,
coding_missing coding_missing
); );
block_start += NUM_DATA; block_start += NUM_DATA;
block_start_idx += NUM_DATA as u64;
// on to the next block
continue; continue;
} }
trace!( trace!(
"2: recovering: data: {} coding: {}", "recover {:x}: recovering: data: {} coding: {}",
debug_id,
data_missing, data_missing,
coding_missing coding_missing
); );
@ -369,13 +471,13 @@ pub fn recover(
let mut size = None; let mut size = None;
// add the data blobs we have into recovery blob vector // add the data blobs we have into recovery blob vector
for i in block_start..coding_end { for i in block_start..block_end {
let j = i % window.len(); let j = i % window.len();
if let Some(b) = window[j].data.clone() { if let Some(b) = window[j].data.clone() {
if meta.is_none() { if meta.is_none() {
meta = Some(b.read().unwrap().meta.clone()); meta = Some(b.read().unwrap().meta.clone());
trace!("meta at {} {:?}", i, meta); trace!("recover {:x} meta at {} {:?}", debug_id, j, meta);
} }
blobs.push(b); blobs.push(b);
} else { } else {
@ -386,7 +488,7 @@ pub fn recover(
erasures.push((i - block_start) as i32); erasures.push((i - block_start) as i32);
} }
} }
for i in coding_start..coding_end { for i in coding_start..block_end {
let j = i % window.len(); let j = i % window.len();
if let Some(b) = window[j].coding.clone() { if let Some(b) = window[j].coding.clone() {
if size.is_none() { if size.is_none() {
@ -401,8 +503,8 @@ pub fn recover(
erasures.push(((i - coding_start) + NUM_DATA) as i32); erasures.push(((i - coding_start) + NUM_DATA) as i32);
} }
} }
// now that we have size, zero out data blob tails // now that we have size (from coding), zero out data blob tails
for i in block_start..coding_end { for i in block_start..block_end {
let j = i % window.len(); let j = i % window.len();
if let Some(b) = &window[j].data { if let Some(b) = &window[j].data {
@ -414,14 +516,15 @@ pub fn recover(
} }
} }
// marks end of erasures
erasures.push(-1); erasures.push(-1);
trace!( trace!(
"erasures: {:?} data_size: {} header_size: {}", "erasures[]: {:x} {:?} data_size: {}",
debug_id,
erasures, erasures,
size.unwrap(), size.unwrap(),
BLOB_HEADER_SIZE
); );
//lock everything //lock everything for write
for b in &blobs { for b in &blobs {
locks.push(b.write().expect("'locks' arr in pb fn recover")); locks.push(b.write().expect("'locks' arr in pb fn recover"));
} }
@ -431,15 +534,16 @@ pub fn recover(
let mut data_ptrs: Vec<&mut [u8]> = Vec::with_capacity(NUM_DATA); let mut data_ptrs: Vec<&mut [u8]> = Vec::with_capacity(NUM_DATA);
for (i, l) in locks.iter_mut().enumerate() { for (i, l) in locks.iter_mut().enumerate() {
if i < NUM_DATA { if i < NUM_DATA {
trace!("pushing data: {}", i); trace!("{:x} pushing data: {}", debug_id, i);
data_ptrs.push(&mut l.data[..size.unwrap()]); data_ptrs.push(&mut l.data[..size.unwrap()]);
} else { } else {
trace!("pushing coding: {}", i); trace!("{:x} pushing coding: {}", debug_id, i);
coding_ptrs.push(&mut l.data_mut()[..size.unwrap()]); coding_ptrs.push(&mut l.data_mut()[..size.unwrap()]);
} }
} }
trace!( trace!(
"coding_ptrs.len: {} data_ptrs.len {}", "{:x} coding_ptrs.len: {} data_ptrs.len {}",
debug_id,
coding_ptrs.len(), coding_ptrs.len(),
data_ptrs.len() data_ptrs.len()
); );
@ -449,27 +553,41 @@ pub fn recover(
&erasures, &erasures,
)?; )?;
} }
let mut corrupt = false;
// repopulate header data size from recovered blob contents
for i in &erasures[..erasures.len() - 1] { for i in &erasures[..erasures.len() - 1] {
let idx = *i as usize; let n = *i as usize;
let mut idx = n as u64 + block_start_idx;
let mut data_size; let mut data_size;
if idx < NUM_DATA { if n < NUM_DATA {
data_size = locks[idx].get_data_size().unwrap(); data_size = locks[n].get_data_size().unwrap();
data_size -= BLOB_HEADER_SIZE as u64; data_size -= BLOB_HEADER_SIZE as u64;
} else { } else {
data_size = size.unwrap() as u64; data_size = size.unwrap() as u64;
idx -= NUM_CODING as u64;
locks[n].set_index(idx).unwrap();
} }
locks[idx].meta = meta.clone().unwrap(); locks[n].meta = meta.clone().unwrap();
locks[idx].set_size(data_size as usize); locks[n].set_size(data_size as usize);
trace!( trace!(
"erasures[{}] size: {} data[0]: {}", "{:x} erasures[{}] ({}) size: {:x} data[0]: {}",
debug_id,
*i, *i,
idx,
data_size, data_size,
locks[idx].data()[0] locks[n].data()[0]
); );
if data_size > BLOB_SIZE as u64 {
corrupt = true;
} }
}
assert!(!corrupt, " {:x} ", debug_id);
block_start += NUM_DATA; block_start += NUM_DATA;
block_start_idx += NUM_DATA as u64;
} }
Ok(()) Ok(())
@ -480,12 +598,12 @@ mod test {
use crdt; use crdt;
use erasure; use erasure;
use logger; use logger;
use packet::BlobRecycler; use packet::{BlobRecycler, BLOB_HEADER_SIZE, BLOB_SIZE};
use rand::{thread_rng, Rng}; use rand::{thread_rng, Rng};
use signature::KeyPair; use signature::KeyPair;
use signature::KeyPairUtil; use signature::KeyPairUtil;
// use std::sync::{Arc, RwLock}; // use std::sync::{Arc, RwLock};
use streamer::WindowSlot; use streamer::{index_blobs, WindowSlot};
#[test] #[test]
pub fn test_coding() { pub fn test_coding() {
@ -549,12 +667,14 @@ mod test {
window_l2.get_index(), window_l2.get_index(),
window_l2.meta.size window_l2.meta.size
); );
for i in 0..8 { for i in 0..64 {
print!("{:>w$} ", window_l2.data()[i], w = 2); print!("{:>w$} ", window_l2.data()[i], w = 3);
} }
} else { } else {
print!("data null "); print!("data null ");
} }
println!("");
print!("window({:>w$}): ", i, w = 2);
if w.coding.is_some() { if w.coding.is_some() {
let window_l1 = w.coding.clone().unwrap(); let window_l1 = w.coding.clone().unwrap();
let window_l2 = window_l1.read().unwrap(); let window_l2 = window_l1.read().unwrap();
@ -564,16 +684,16 @@ mod test {
window_l2.meta.size window_l2.meta.size
); );
for i in 0..8 { for i in 0..8 {
print!("{:>w$} ", window_l2.data()[i], w = 2); print!("{:>w$} ", window_l2.data()[i], w = 3);
} }
} else { } else {
print!("coding null"); print!("coding null");
} }
println!(""); println!("");
} }
} }
const WINDOW_SIZE: usize = 64;
fn generate_window( fn generate_window(
blob_recycler: &BlobRecycler, blob_recycler: &BlobRecycler,
offset: usize, offset: usize,
@ -584,9 +704,9 @@ mod test {
data: None, data: None,
coding: None coding: None
}; };
32 WINDOW_SIZE
]; ];
let mut blobs = Vec::new(); let mut blobs = Vec::with_capacity(num_blobs);
for i in 0..num_blobs { for i in 0..num_blobs {
let b = blob_recycler.allocate(); let b = blob_recycler.allocate();
let b_ = b.clone(); let b_ = b.clone();
@ -599,8 +719,11 @@ mod test {
for k in 0..data_len { for k in 0..data_len {
w.data_mut()[k] = (k + i) as u8; w.data_mut()[k] = (k + i) as u8;
} }
// overfill, simulates re-used blobs // overfill, simulates re-used blobs
w.data_mut()[data_len] = thread_rng().gen(); for i in BLOB_HEADER_SIZE + data_len..BLOB_SIZE {
w.data[i] = thread_rng().gen();
}
blobs.push(b_); blobs.push(b_);
} }
@ -613,9 +736,10 @@ mod test {
"127.0.0.1:1237".parse().unwrap(), "127.0.0.1:1237".parse().unwrap(),
"127.0.0.1:1238".parse().unwrap(), "127.0.0.1:1238".parse().unwrap(),
); );
assert!(crdt::Crdt::index_blobs(&d, &blobs, &mut (offset as u64)).is_ok()); assert!(index_blobs(&d, &blobs, &mut (offset as u64)).is_ok());
for b in blobs { for b in blobs {
let idx = b.read().unwrap().get_index().unwrap() as usize; let idx = b.read().unwrap().get_index().unwrap() as usize % WINDOW_SIZE;
window[idx].data = Some(b); window[idx].data = Some(b);
} }
window window
@ -630,7 +754,9 @@ mod test {
} as usize; } as usize;
let mut b_l = b.write().unwrap(); let mut b_l = b.write().unwrap();
b_l.data[size] = thread_rng().gen(); for i in size..BLOB_SIZE {
b_l.data[i] = thread_rng().gen();
}
} }
} }
} }
@ -640,15 +766,49 @@ mod test {
logger::setup(); logger::setup();
let blob_recycler = BlobRecycler::default(); let blob_recycler = BlobRecycler::default();
{
let mut blobs = Vec::with_capacity(WINDOW_SIZE * 2);
for _ in 0..WINDOW_SIZE * 10 {
let blob = blob_recycler.allocate();
{
let mut b_l = blob.write().unwrap();
for i in 0..BLOB_SIZE {
b_l.data[i] = thread_rng().gen();
}
// some of the blobs should have previously been used for coding
if thread_rng().gen_bool(erasure::NUM_CODING as f64 / erasure::NUM_DATA as f64)
{
b_l.set_coding().unwrap();
}
}
blobs.push(blob);
}
for blob in blobs {
blob_recycler.recycle(blob);
}
}
// Generate a window // Generate a window
let offset = 1; let offset = 0;
let num_blobs = erasure::NUM_DATA + 2; let num_blobs = erasure::NUM_DATA + 2;
let mut window = generate_window(&blob_recycler, 0, num_blobs); let mut window = generate_window(&blob_recycler, WINDOW_SIZE, num_blobs);
for i in 0..window.len() {
if let Some(blob) = &window[i].data {
let blob_r = blob.read().unwrap();
assert!(!blob_r.is_coding());
}
}
println!("** after-gen-window:"); println!("** after-gen-window:");
print_window(&window); print_window(&window);
// Generate the coding blocks // Generate the coding blocks
assert!(erasure::generate_coding(&mut window, &blob_recycler, offset, num_blobs).is_ok()); assert!(
erasure::generate_coding(0, &mut window, &blob_recycler, offset, num_blobs).is_ok()
);
println!("** after-gen-coding:"); println!("** after-gen-coding:");
print_window(&window); print_window(&window);
@ -664,7 +824,16 @@ mod test {
scramble_window_tails(&mut window, num_blobs); scramble_window_tails(&mut window, num_blobs);
// Recover it from coding // Recover it from coding
assert!(erasure::recover(&blob_recycler, &mut window, offset, num_blobs).is_ok()); assert!(
erasure::recover(
0,
&blob_recycler,
&mut window,
(offset + WINDOW_SIZE) as u64,
offset,
num_blobs
).is_ok()
);
println!("** after-recover:"); println!("** after-recover:");
print_window(&window); print_window(&window);
@ -684,7 +853,10 @@ mod test {
assert_eq!(window_l2.meta.addr, ref_l2.meta.addr); assert_eq!(window_l2.meta.addr, ref_l2.meta.addr);
assert_eq!(window_l2.meta.port, ref_l2.meta.port); assert_eq!(window_l2.meta.port, ref_l2.meta.port);
assert_eq!(window_l2.meta.v6, ref_l2.meta.v6); assert_eq!(window_l2.meta.v6, ref_l2.meta.v6);
assert_eq!(window_l2.get_index().unwrap(), erase_offset as u64); assert_eq!(
window_l2.get_index().unwrap(),
(erase_offset + WINDOW_SIZE) as u64
);
} }
println!("** whack coding block and data block"); println!("** whack coding block and data block");
@ -700,7 +872,16 @@ mod test {
print_window(&window); print_window(&window);
// Recover it from coding // Recover it from coding
assert!(erasure::recover(&blob_recycler, &mut window, offset, num_blobs).is_ok()); assert!(
erasure::recover(
0,
&blob_recycler,
&mut window,
(offset + WINDOW_SIZE) as u64,
offset,
num_blobs
).is_ok()
);
println!("** after-recover:"); println!("** after-recover:");
print_window(&window); print_window(&window);
@ -718,7 +899,65 @@ mod test {
assert_eq!(window_l2.meta.addr, ref_l2.meta.addr); assert_eq!(window_l2.meta.addr, ref_l2.meta.addr);
assert_eq!(window_l2.meta.port, ref_l2.meta.port); assert_eq!(window_l2.meta.port, ref_l2.meta.port);
assert_eq!(window_l2.meta.v6, ref_l2.meta.v6); assert_eq!(window_l2.meta.v6, ref_l2.meta.v6);
assert_eq!(window_l2.get_index().unwrap(), erase_offset as u64); assert_eq!(
window_l2.get_index().unwrap(),
(erase_offset + WINDOW_SIZE) as u64
);
}
println!("** make stale data block index");
// tests recovery of a data block whose index has gone stale
let erase_offset = offset;
// Create a hole in the window by making the blob's index stale
let refwindow = window[offset].data.clone();
if let Some(blob) = &window[erase_offset].data {
blob.write()
.unwrap()
.set_index(erase_offset as u64)
.unwrap(); // this also writes to refwindow...
}
print_window(&window);
// Recover it from coding
assert!(
erasure::recover(
0,
&blob_recycler,
&mut window,
(offset + WINDOW_SIZE) as u64,
offset,
num_blobs
).is_ok()
);
println!("** after-recover:");
print_window(&window);
// fix refwindow, we wrote to it above...
if let Some(blob) = &refwindow {
blob.write()
.unwrap()
.set_index((erase_offset + WINDOW_SIZE) as u64)
.unwrap(); // this also writes to refwindow...
}
{
// Check the result, block is here to drop locks
let window_l = window[erase_offset].data.clone().unwrap();
let window_l2 = window_l.read().unwrap();
let ref_l = refwindow.clone().unwrap();
let ref_l2 = ref_l.read().unwrap();
assert_eq!(window_l2.meta.size, ref_l2.meta.size);
assert_eq!(
window_l2.data[..window_l2.meta.size],
ref_l2.data[..window_l2.meta.size]
);
assert_eq!(window_l2.meta.addr, ref_l2.meta.addr);
assert_eq!(window_l2.meta.port, ref_l2.meta.port);
assert_eq!(window_l2.meta.v6, ref_l2.meta.v6);
assert_eq!(
window_l2.get_index().unwrap(),
(erase_offset + WINDOW_SIZE) as u64
);
} }
} }

View File

@ -142,7 +142,7 @@ impl FullNode {
fn new_window( fn new_window(
ledger_tail: Option<Vec<Entry>>, ledger_tail: Option<Vec<Entry>>,
entry_height: u64, entry_height: u64,
crdt: &Arc<RwLock<Crdt>>, node_info: &NodeInfo,
blob_recycler: &BlobRecycler, blob_recycler: &BlobRecycler,
) -> streamer::Window { ) -> streamer::Window {
match ledger_tail { match ledger_tail {
@ -153,7 +153,7 @@ impl FullNode {
// flatten deque to vec // flatten deque to vec
let blobs: Vec<_> = blobs.into_iter().collect(); let blobs: Vec<_> = blobs.into_iter().collect();
streamer::initialized_window(&crdt, blobs, entry_height) streamer::initialized_window(&node_info, blobs, entry_height)
} }
None => streamer::default_window(), None => streamer::default_window(),
} }
@ -203,6 +203,8 @@ impl FullNode {
thread_hdls.extend(rpu.thread_hdls()); thread_hdls.extend(rpu.thread_hdls());
let blob_recycler = BlobRecycler::default(); let blob_recycler = BlobRecycler::default();
let window = FullNode::new_window(ledger_tail, entry_height, &node.data, &blob_recycler);
let crdt = Arc::new(RwLock::new(Crdt::new(node.data).expect("Crdt::new"))); let crdt = Arc::new(RwLock::new(Crdt::new(node.data).expect("Crdt::new")));
let (tpu, blob_receiver) = Tpu::new( let (tpu, blob_receiver) = Tpu::new(
&bank, &bank,
@ -214,7 +216,6 @@ impl FullNode {
writer, writer,
); );
thread_hdls.extend(tpu.thread_hdls()); thread_hdls.extend(tpu.thread_hdls());
let window = FullNode::new_window(ledger_tail, entry_height, &crdt, &blob_recycler);
let ncp = Ncp::new( let ncp = Ncp::new(
&crdt, &crdt,
window.clone(), window.clone(),
@ -285,15 +286,14 @@ impl FullNode {
); );
thread_hdls.extend(rpu.thread_hdls()); thread_hdls.extend(rpu.thread_hdls());
let blob_recycler = BlobRecycler::default();
let window = FullNode::new_window(ledger_tail, entry_height, &node.data, &blob_recycler);
let crdt = Arc::new(RwLock::new(Crdt::new(node.data).expect("Crdt::new"))); let crdt = Arc::new(RwLock::new(Crdt::new(node.data).expect("Crdt::new")));
crdt.write() crdt.write()
.expect("'crdt' write lock before insert() in pub fn replicate") .expect("'crdt' write lock before insert() in pub fn replicate")
.insert(&entry_point); .insert(&entry_point);
let blob_recycler = BlobRecycler::default();
let window = FullNode::new_window(ledger_tail, entry_height, &crdt, &blob_recycler);
let ncp = Ncp::new( let ncp = Ncp::new(
&crdt, &crdt,
window.clone(), window.clone(),

View File

@ -166,14 +166,14 @@ pub fn blob_receiver(
fn find_next_missing( fn find_next_missing(
window: &Window, window: &Window,
crdt: &Arc<RwLock<Crdt>>, crdt: &Arc<RwLock<Crdt>>,
consumed: &mut u64, consumed: u64,
received: &mut u64, received: u64,
) -> Result<Vec<(SocketAddr, Vec<u8>)>> { ) -> Result<Vec<(SocketAddr, Vec<u8>)>> {
if *received <= *consumed { if received <= consumed {
Err(WindowError::GenericError)?; Err(WindowError::GenericError)?;
} }
let window = window.read().unwrap(); let window = window.read().unwrap();
let reqs: Vec<_> = (*consumed..*received) let reqs: Vec<_> = (consumed..received)
.filter_map(|pix| { .filter_map(|pix| {
let i = (pix % WINDOW_SIZE) as usize; let i = (pix % WINDOW_SIZE) as usize;
if window[i].data.is_none() { if window[i].data.is_none() {
@ -194,23 +194,18 @@ fn repair_window(
crdt: &Arc<RwLock<Crdt>>, crdt: &Arc<RwLock<Crdt>>,
last: &mut u64, last: &mut u64,
times: &mut usize, times: &mut usize,
consumed: &mut u64, consumed: u64,
received: &mut u64, received: u64,
) -> Result<()> { ) -> Result<()> {
//exponential backoff //exponential backoff
if *last != *consumed { if *last != consumed {
*times = 0; *times = 0;
} }
*last = *consumed; *last = consumed;
*times += 1; *times += 1;
//if times flips from all 1s 7 -> 8, 15 -> 16, we retry otherwise return Ok //if times flips from all 1s 7 -> 8, 15 -> 16, we retry otherwise return Ok
if *times & (*times - 1) != 0 { if *times & (*times - 1) != 0 {
trace!( trace!("repair_window counter {} {} {}", *times, consumed, received);
"repair_window counter {} {} {}",
*times,
*consumed,
*received
);
return Ok(()); return Ok(());
} }
@ -222,8 +217,8 @@ fn repair_window(
"{:x}: repair_window counter times: {} consumed: {} received: {} missing: {}", "{:x}: repair_window counter times: {} consumed: {} received: {} missing: {}",
debug_id, debug_id,
*times, *times,
*consumed, consumed,
*received, received,
reqs.len() reqs.len()
); );
} }
@ -231,8 +226,8 @@ fn repair_window(
for (to, req) in reqs { for (to, req) in reqs {
//todo cache socket //todo cache socket
debug!( debug!(
"{:x} repair_window request {} {} {}", "{:x}: repair_window request {} {} {}",
debug_id, *consumed, *received, to debug_id, consumed, received, to
); );
assert!(req.len() < BLOB_SIZE); assert!(req.len() < BLOB_SIZE);
sock.send_to(&req, to)?; sock.send_to(&req, to)?;
@ -245,8 +240,8 @@ fn retransmit_all_leader_blocks(
dq: &mut SharedBlobs, dq: &mut SharedBlobs,
debug_id: u64, debug_id: u64,
recycler: &BlobRecycler, recycler: &BlobRecycler,
consumed: &mut u64, consumed: u64,
received: &mut u64, received: u64,
retransmit: &BlobSender, retransmit: &BlobSender,
) -> Result<()> { ) -> Result<()> {
let mut retransmit_queue = VecDeque::new(); let mut retransmit_queue = VecDeque::new();
@ -288,8 +283,8 @@ fn retransmit_all_leader_blocks(
debug!( debug!(
"{:x}: RECV_WINDOW {} {}: retransmit {}", "{:x}: RECV_WINDOW {} {}: retransmit {}",
debug_id, debug_id,
*consumed, consumed,
*received, received,
retransmit_queue.len(), retransmit_queue.len(),
); );
inc_new_counter!("streamer-recv_window-retransmit", retransmit_queue.len()); inc_new_counter!("streamer-recv_window-retransmit", retransmit_queue.len());
@ -298,40 +293,6 @@ fn retransmit_all_leader_blocks(
Ok(()) Ok(())
} }
/// make space in window for newly received blobs that come after
/// consumed, before received, clear any old ones
fn reset_slots(
window: &mut [WindowSlot],
recycler: &BlobRecycler,
consumed: u64,
received: u64,
debug_id: u64,
) {
for ix in consumed..received {
let k = (ix % WINDOW_SIZE) as usize;
let mut old = false;
if let Some(b) = &window[k].data {
old = b.read().unwrap().get_index().unwrap() < consumed;
}
if old {
if let Some(b) = mem::replace(&mut window[k].data, None) {
debug!("{:x}: recycling data blob at index {:}", debug_id, k);
recycler.recycle(b);
}
}
if let Some(b) = &window[k].coding {
old = b.read().unwrap().get_index().unwrap() < consumed;
}
if old {
if let Some(b) = mem::replace(&mut window[k].coding, None) {
debug!("{:x}: recycling coding blob at index {:}", debug_id, k);
recycler.recycle(b);
}
}
}
}
/// process a blob: Add blob to the window. If a continuous set of blobs /// process a blob: Add blob to the window. If a continuous set of blobs
/// starting from consumed is thereby formed, add that continuous /// starting from consumed is thereby formed, add that continuous
/// range of blobs to a queue to be sent on to the next stage. /// range of blobs to a queue to be sent on to the next stage.
@ -348,9 +309,8 @@ fn reset_slots(
/// * `consumed` - input/output, the entry-height to which this /// * `consumed` - input/output, the entry-height to which this
/// node has populated and rebroadcast entries /// node has populated and rebroadcast entries
fn process_blob( fn process_blob(
b: SharedBlob, blob: SharedBlob,
pix: u64, pix: u64,
w: usize,
consume_queue: &mut SharedBlobs, consume_queue: &mut SharedBlobs,
window: &Window, window: &Window,
debug_id: u64, debug_id: u64,
@ -359,70 +319,70 @@ fn process_blob(
received: u64, received: u64,
) { ) {
let mut window = window.write().unwrap(); let mut window = window.write().unwrap();
let w = (pix % WINDOW_SIZE) as usize;
if pix == received {
// When pix == received, we've *just* updated received, which means
// possibly new slots between consumed and received have been exposed,
// so clean up old blobs between consumed and received
reset_slots(&mut window, recycler, *consumed, received, debug_id);
}
let is_coding = { let is_coding = {
let blob_r = b.read().expect("blob read lock for flogs streamer::window"); let blob_r = blob.read()
.expect("blob read lock for flogs streamer::window");
blob_r.is_coding() blob_r.is_coding()
}; };
// insert the new blob into the window if it's coding or data // insert the new blob into the window, overwrite and recycle old (or duplicate) entry
if is_coding { let is_duplicate = if is_coding {
// Insert the new blob into the window if let Some(old) = mem::replace(&mut window[w].coding, Some(blob)) {
// spot should be free because we cleared it above if old.read().unwrap().get_index().unwrap() == pix {
if window[w].coding.is_none() { trace!("{:x}: duplicate coding blob at index {:}", debug_id, pix);
window[w].coding = Some(b);
} else if let Some(blob) = &window[w].coding {
if blob.read().unwrap().get_index().unwrap() != pix as u64 {
warn!("{:x}: overrun coding blob at index {:}", debug_id, w);
} else {
debug!("{:x}: duplicate coding blob at index {:}", debug_id, w);
} }
trace!("{:x}: recycling coding blob at index {:}", debug_id, pix);
recycler.recycle(old);
true
} else {
trace!("{:x}: empty coding window slot {:}", debug_id, pix);
false
} }
} else { } else {
if window[w].data.is_none() { if let Some(old) = mem::replace(&mut window[w].data, Some(blob)) {
window[w].data = Some(b); if old.read().unwrap().get_index().unwrap() == pix {
} else if let Some(blob) = &window[w].data { trace!("{:x}: duplicate data blob at index {:}", debug_id, pix);
if blob.read().unwrap().get_index().unwrap() != pix as u64 { }
warn!("{:x}: overrun data blob at index {:}", debug_id, w); trace!("{:x}: recycling data blob at index {:}", debug_id, pix);
recycler.recycle(old);
true
} else { } else {
debug!("{:x}: duplicate data blob at index {:}", debug_id, w); trace!("{:x}: empty data window slot {:}", debug_id, pix);
} false
} }
};
if is_duplicate {
return;
} }
#[cfg(feature = "erasure")] #[cfg(feature = "erasure")]
{ {
if erasure::recover( if erasure::recover(
debug_id,
recycler, recycler,
&mut window, &mut window,
*consumed,
(*consumed % WINDOW_SIZE) as usize, (*consumed % WINDOW_SIZE) as usize,
(received - *consumed) as usize, (received - *consumed) as usize,
).is_err() ).is_err()
{ {
trace!("erasure::recover failed"); trace!("{:x}: erasure::recover failed", debug_id);
} }
} }
// // Search the window for wrong data blobs...
// for ix in *consumed..(received + 1) {
// let k = (ix % WINDOW_SIZE) as usize;
//
// if let Some(b) = &window[k].data {
// assert_eq!(ix, b.read().unwrap().get_index().unwrap());
// }
// }
// push all contiguous blobs into consumed queue, increment consumed // push all contiguous blobs into consumed queue, increment consumed
loop { loop {
let k = (*consumed % WINDOW_SIZE) as usize; let k = (*consumed % WINDOW_SIZE) as usize;
trace!("k: {} consumed: {} received: {}", k, *consumed, received); trace!(
"{:x}: k: {} consumed: {} received: {}",
debug_id,
k,
*consumed,
received
);
if let Some(blob) = &window[k].data { if let Some(blob) = &window[k].data {
if blob.read().unwrap().get_index().unwrap() < *consumed { if blob.read().unwrap().get_index().unwrap() < *consumed {
@ -433,7 +393,6 @@ fn process_blob(
// window[k].data is None, end of received // window[k].data is None, end of received
break; break;
} }
consume_queue.push_back(window[k].data.clone().expect("clone in fn recv_window")); consume_queue.push_back(window[k].data.clone().expect("clone in fn recv_window"));
*consumed += 1; *consumed += 1;
} }
@ -473,8 +432,8 @@ fn recv_window(
&mut dq, &mut dq,
debug_id, debug_id,
recycler, recycler,
consumed, *consumed,
received, *received,
retransmit, retransmit,
)?; )?;
@ -497,16 +456,12 @@ fn recv_window(
); );
continue; continue;
} }
let w = (pix % WINDOW_SIZE) as usize;
//TODO, after the block are authenticated trace!("{:x} window pix: {} size: {}", debug_id, pix, meta_size);
//if we get different blocks at the same index
//that is a network failure/attack
trace!("window w: {} size: {}", w, meta_size);
process_blob( process_blob(
b, b,
pix, pix,
w,
&mut consume_queue, &mut consume_queue,
window, window,
debug_id, debug_id,
@ -516,7 +471,11 @@ fn recv_window(
); );
} }
print_window(debug_id, window, *consumed); print_window(debug_id, window, *consumed);
trace!("sending consume_queue.len: {}", consume_queue.len()); trace!(
"{:x}: sending consume_queue.len: {}",
debug_id,
consume_queue.len()
);
if !consume_queue.is_empty() { if !consume_queue.is_empty() {
debug!( debug!(
"{:x}: RECV_WINDOW {} {}: forwarding consume_queue {}", "{:x}: RECV_WINDOW {} {}: forwarding consume_queue {}",
@ -525,7 +484,11 @@ fn recv_window(
*received, *received,
consume_queue.len(), consume_queue.len(),
); );
trace!("sending consume_queue.len: {}", consume_queue.len()); trace!(
"{:x}: sending consume_queue.len: {}",
debug_id,
consume_queue.len()
);
inc_new_counter!("streamer-recv_window-consume", consume_queue.len()); inc_new_counter!("streamer-recv_window-consume", consume_queue.len());
s.send(consume_queue)?; s.send(consume_queue)?;
} }
@ -533,28 +496,45 @@ fn recv_window(
} }
fn print_window(debug_id: u64, window: &Window, consumed: u64) { fn print_window(debug_id: u64, window: &Window, consumed: u64) {
let buf: Vec<_> = window let pointer: Vec<_> = window
.read() .read()
.unwrap() .unwrap()
.iter() .iter()
.enumerate() .enumerate()
.map(|(i, v)| { .map(|(i, _v)| {
if i == (consumed % WINDOW_SIZE) as usize { if i == (consumed % WINDOW_SIZE) as usize {
"_" "V"
} else if v.data.is_none() && v.coding.is_none() {
"0"
} else if v.data.is_some() && v.coding.is_some() {
"X"
} else if v.data.is_some() {
// coding.is_none()
"D"
} else { } else {
// data.is_none() " "
"C"
} }
}) })
.collect(); .collect();
trace!("{:x}:WINDOW ({}): {}", debug_id, consumed, buf.join(""));
let buf: Vec<_> = window
.read()
.unwrap()
.iter()
.map(|v| {
if v.data.is_none() && v.coding.is_none() {
"O"
} else if v.data.is_some() && v.coding.is_some() {
"D"
} else if v.data.is_some() {
// coding.is_none()
"d"
} else {
// data.is_none()
"c"
}
})
.collect();
trace!(
"{:x}: WINDOW ({}): {}",
debug_id,
consumed,
pointer.join("")
);
trace!("{:x}: WINDOW ({}): {}", debug_id, consumed, buf.join(""));
} }
pub fn default_window() -> Window { pub fn default_window() -> Window {
@ -564,37 +544,58 @@ pub fn default_window() -> Window {
])) ]))
} }
/// Stamp every blob with the sender's id and a sequential index, and clear
/// its flags.
///
/// * `node_info` - node whose `id` is written into each blob
/// * `blobs` - blobs to stamp; blob `i` receives index `*receive_index + i`
/// * `receive_index` - base index for the first blob; it is only read here
///   and is NOT advanced
///
/// Always returns `Ok(())`.
///
/// # Panics
///
/// Panics if a blob's write lock cannot be acquired, or if setting the id,
/// index or flags on a blob fails.
pub fn index_blobs(
    node_info: &NodeInfo,
    blobs: &[SharedBlob],
    receive_index: &mut u64,
) -> Result<()> {
    // enumerate all the blobs, those are the indices
    trace!("{:x}: INDEX_BLOBS {}", node_info.debug_id(), blobs.len());
    let base_index = *receive_index;
    for (offset, shared) in blobs.iter().enumerate() {
        // only leader should be broadcasting
        let mut blob = shared
            .write()
            .expect("'blob' write lock in streamer::index_blobs");
        blob.set_id(node_info.id)
            .expect("set_id in streamer::index_blobs");
        blob.set_index(base_index + offset as u64)
            .expect("set_index in streamer::index_blobs");
        // re-used blobs need to have their flags cleared
        blob.set_flags(0)
            .expect("set_flags in streamer::index_blobs");
    }
    Ok(())
}
/// Initialize a rebroadcast window with most recent Entry blobs /// Initialize a rebroadcast window with most recent Entry blobs
/// * `crdt` - gossip instance, used to set blob ids /// * `crdt` - gossip instance, used to set blob ids
/// * `blobs` - up to WINDOW_SIZE most recent blobs /// * `blobs` - up to WINDOW_SIZE most recent blobs
/// * `entry_height` - current entry height /// * `entry_height` - current entry height
pub fn initialized_window( pub fn initialized_window(
crdt: &Arc<RwLock<Crdt>>, node_info: &NodeInfo,
blobs: Vec<SharedBlob>, blobs: Vec<SharedBlob>,
entry_height: u64, entry_height: u64,
) -> Window { ) -> Window {
let window = default_window(); let window = default_window();
let debug_id = node_info.debug_id();
{ {
let mut win = window.write().unwrap(); let mut win = window.write().unwrap();
let me = crdt.read().unwrap().my_data().clone();
debug!( trace!(
"initialized window entry_height:{} blobs_len:{}", "{:x} initialized window entry_height:{} blobs_len:{}",
debug_id,
entry_height, entry_height,
blobs.len() blobs.len()
); );
// Index the blobs // Index the blobs
let mut received = entry_height - blobs.len() as u64; let mut received = entry_height - blobs.len() as u64;
Crdt::index_blobs(&me, &blobs, &mut received).expect("index blobs for initial window"); index_blobs(&node_info, &blobs, &mut received).expect("index blobs for initial window");
// populate the window, offset by implied index // populate the window, offset by implied index
let diff = cmp::max(blobs.len() as isize - win.len() as isize, 0) as usize; let diff = cmp::max(blobs.len() as isize - win.len() as isize, 0) as usize;
for b in blobs.into_iter().skip(diff) { for b in blobs.into_iter().skip(diff) {
let ix = b.read().unwrap().get_index().expect("blob index"); let ix = b.read().unwrap().get_index().expect("blob index");
let pos = (ix % WINDOW_SIZE) as usize; let pos = (ix % WINDOW_SIZE) as usize;
trace!("caching {} at {}", ix, pos); trace!("{:x} caching {} at {}", debug_id, ix, pos);
assert!(win[pos].data.is_none()); assert!(win[pos].data.is_none());
win[pos].data = Some(b); win[pos].data = Some(b);
} }
@ -643,22 +644,15 @@ pub fn window(
} }
} }
let _ = repair_window( let _ = repair_window(
debug_id, debug_id, &window, &crdt, &mut last, &mut times, consumed, received,
&window,
&crdt,
&mut last,
&mut times,
&mut consumed,
&mut received,
); );
assert!(consumed <= (received + 1));
} }
}) })
.unwrap() .unwrap()
} }
fn broadcast( fn broadcast(
me: &NodeInfo, node_info: &NodeInfo,
broadcast_table: &[NodeInfo], broadcast_table: &[NodeInfo],
window: &Window, window: &Window,
recycler: &BlobRecycler, recycler: &BlobRecycler,
@ -667,7 +661,7 @@ fn broadcast(
transmit_index: &mut u64, transmit_index: &mut u64,
receive_index: &mut u64, receive_index: &mut u64,
) -> Result<()> { ) -> Result<()> {
let debug_id = me.debug_id(); let debug_id = node_info.debug_id();
let timer = Duration::new(1, 0); let timer = Duration::new(1, 0);
let mut dq = r.recv_timeout(timer)?; let mut dq = r.recv_timeout(timer)?;
while let Ok(mut nq) = r.try_recv() { while let Ok(mut nq) = r.try_recv() {
@ -681,14 +675,15 @@ fn broadcast(
// break them up into window-sized chunks to process // break them up into window-sized chunks to process
let blobs_chunked = blobs_vec.chunks(WINDOW_SIZE as usize).map(|x| x.to_vec()); let blobs_chunked = blobs_vec.chunks(WINDOW_SIZE as usize).map(|x| x.to_vec());
print_window(me.debug_id(), window, *receive_index); print_window(debug_id, window, *receive_index);
for mut blobs in blobs_chunked { for mut blobs in blobs_chunked {
let blobs_len = blobs.len(); let blobs_len = blobs.len();
debug!("{:x} broadcast blobs.len: {}", debug_id, blobs_len); trace!("{:x}: broadcast blobs.len: {}", debug_id, blobs_len);
// Index the blobs // Index the blobs
Crdt::index_blobs(&me, &blobs, receive_index)?; index_blobs(node_info, &blobs, receive_index).expect("index blobs for initial window");
// keep the cache of blobs that are broadcast // keep the cache of blobs that are broadcast
inc_new_counter!("streamer-broadcast-sent", blobs.len()); inc_new_counter!("streamer-broadcast-sent", blobs.len());
{ {
@ -699,7 +694,8 @@ fn broadcast(
let pos = (ix % WINDOW_SIZE) as usize; let pos = (ix % WINDOW_SIZE) as usize;
if let Some(x) = mem::replace(&mut win[pos].data, None) { if let Some(x) = mem::replace(&mut win[pos].data, None) {
trace!( trace!(
"popped {} at {}", "{:x} popped {} at {}",
debug_id,
x.read().unwrap().get_index().unwrap(), x.read().unwrap().get_index().unwrap(),
pos pos
); );
@ -707,19 +703,20 @@ fn broadcast(
} }
if let Some(x) = mem::replace(&mut win[pos].coding, None) { if let Some(x) = mem::replace(&mut win[pos].coding, None) {
trace!( trace!(
"popped {} at {}", "{:x} popped {} at {}",
debug_id,
x.read().unwrap().get_index().unwrap(), x.read().unwrap().get_index().unwrap(),
pos pos
); );
recycler.recycle(x); recycler.recycle(x);
} }
trace!("null {}", pos); trace!("{:x} null {}", debug_id, pos);
} }
while let Some(b) = blobs.pop() { while let Some(b) = blobs.pop() {
let ix = b.read().unwrap().get_index().expect("blob index"); let ix = b.read().unwrap().get_index().expect("blob index");
let pos = (ix % WINDOW_SIZE) as usize; let pos = (ix % WINDOW_SIZE) as usize;
trace!("caching {} at {}", ix, pos); trace!("{:x} caching {} at {}", debug_id, ix, pos);
assert!(win[pos].data.is_none()); assert!(win[pos].data.is_none());
win[pos].data = Some(b); win[pos].data = Some(b);
} }
@ -729,6 +726,7 @@ fn broadcast(
#[cfg(feature = "erasure")] #[cfg(feature = "erasure")]
{ {
erasure::generate_coding( erasure::generate_coding(
debug_id,
&mut window.write().unwrap(), &mut window.write().unwrap(),
recycler, recycler,
(*receive_index % WINDOW_SIZE) as usize, (*receive_index % WINDOW_SIZE) as usize,
@ -740,7 +738,7 @@ fn broadcast(
// Send blobs out from the window // Send blobs out from the window
Crdt::broadcast( Crdt::broadcast(
&me, &node_info,
&broadcast_table, &broadcast_table,
&window, &window,
&sock, &sock,