Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add option to specify chunk size #298

Open
wants to merge 3 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from 2 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 3 additions & 0 deletions replibyte/src/cli.rs
Original file line number Diff line number Diff line change
Expand Up @@ -110,6 +110,9 @@ pub struct DumpCreateArgs {
/// dump name
#[clap(short, long)]
pub name: Option<String>,
/// chunk size, default to 100
#[clap(short, long)]
pub chunk_size: Option<usize>,
}

#[derive(Args, Debug)]
Expand Down
1 change: 1 addition & 0 deletions replibyte/src/commands/dump.rs
Original file line number Diff line number Diff line change
Expand Up @@ -132,6 +132,7 @@ where
skip_config: &skip_config,
database_subset: &source.database_subset,
only_tables: &only_tables_config,
chunk_size: &args.chunk_size,
};

match args.source_type.as_ref().map(|x| x.as_str()) {
Expand Down
1 change: 1 addition & 0 deletions replibyte/src/source/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -29,4 +29,5 @@ pub struct SourceOptions<'a> {
pub skip_config: &'a Vec<SkipConfig>,
pub database_subset: &'a Option<DatabaseSubsetConfig>,
pub only_tables: &'a Vec<OnlyTablesConfig>,
pub chunk_size: &'a Option<usize>,
}
3 changes: 3 additions & 0 deletions replibyte/src/source/mongodb.rs
Original file line number Diff line number Diff line change
Expand Up @@ -368,6 +368,7 @@ mod tests {
skip_config: &vec![],
database_subset: &None,
only_tables: &vec![],
chunk_size: &None,
};

assert!(p.read(source_options, |_, _| {}).is_ok());
Expand All @@ -380,6 +381,7 @@ mod tests {
skip_config: &vec![],
database_subset: &None,
only_tables: &vec![],
chunk_size: &None,
};

assert!(p.read(source_options, |_, _| {}).is_err());
Expand All @@ -395,6 +397,7 @@ mod tests {
skip_config: &vec![],
database_subset: &None,
only_tables: &vec![],
chunk_size: &None,
};

p.read(source_options, |original_query, query| {
Expand Down
3 changes: 3 additions & 0 deletions replibyte/src/source/mysql.rs
Original file line number Diff line number Diff line change
Expand Up @@ -456,6 +456,7 @@ mod tests {
skip_config: &vec![],
database_subset: &None,
only_tables: &vec![],
chunk_size: &None,
};

assert!(p.read(source_options, |_original_query, _query| {}).is_ok());
Expand All @@ -468,6 +469,7 @@ mod tests {
skip_config: &vec![],
database_subset: &None,
only_tables: &vec![],
chunk_size: &None,
};
assert!(p
.read(source_options, |_original_query, _query| {})
Expand All @@ -484,6 +486,7 @@ mod tests {
skip_config: &vec![],
database_subset: &None,
only_tables: &vec![],
chunk_size: &None,
};
let _ = p.read(source_options, |original_query, query| {
assert!(original_query.data().len() > 0);
Expand Down
7 changes: 7 additions & 0 deletions replibyte/src/source/postgres.rs
Original file line number Diff line number Diff line change
Expand Up @@ -581,6 +581,7 @@ mod tests {
skip_config: &vec![],
database_subset: &None,
only_tables: &vec![],
chunk_size: &None,
};

assert!(p.read(source_options, |original_query, query| {}).is_ok());
Expand All @@ -593,6 +594,7 @@ mod tests {
skip_config: &vec![],
database_subset: &None,
only_tables: &vec![],
chunk_size: &None,
};

assert!(p.read(source_options, |original_query, query| {}).is_err());
Expand All @@ -608,6 +610,7 @@ mod tests {
skip_config: &vec![],
database_subset: &None,
only_tables: &vec![],
chunk_size: &None,
};

let _ = p.read(source_options, |original_query, query| {
Expand Down Expand Up @@ -734,6 +737,7 @@ mod tests {
skip_config: &vec![],
database_subset: &None,
only_tables: &vec![],
chunk_size: &None,
};

let _ = p.read(source_options, |original_query, query| {
Expand Down Expand Up @@ -775,6 +779,7 @@ mod tests {
skip_config: &skip_config,
database_subset: &None,
only_tables: &vec![],
chunk_size: &None,
};

let _ = p.read(source_options, |_original_query, query| {
Expand Down Expand Up @@ -826,6 +831,7 @@ mod tests {
passthrough_tables: None,
}),
only_tables: &vec![],
chunk_size: &None,
};

let mut rows_percent_50 = vec![];
Expand Down Expand Up @@ -863,6 +869,7 @@ mod tests {
passthrough_tables: None,
}),
only_tables: &vec![],
chunk_size: &None,
};

let mut rows_percent_30 = vec![];
Expand Down
5 changes: 3 additions & 2 deletions replibyte/src/tasks/full_dump.rs
Original file line number Diff line number Diff line change
Expand Up @@ -69,8 +69,9 @@ where
Ok(())
});

// buffer of 100MB in memory to use and re-use to upload data into datastore
let buffer_size = 100 * 1024 * 1024;
// buffer default of 100MB (unless specified) in memory to use and re-use to upload data into datastore
let chunk_size = self.options.chunk_size.unwrap_or(100);
let buffer_size = chunk_size * 1024 * 1024;
let mut queries = vec![];
let mut consumed_buffer_size = 0usize;
let mut total_transferred_bytes = 0usize;
Expand Down