use crate::text::parse_result::{fatal_parse_error, IonParseResult, UpgradeIResult};
use nom::branch::alt;
use nom::bytes::streaming::{is_a, tag};
use nom::character::streaming::alphanumeric1;
use nom::combinator::{opt, recognize};
use nom::multi::{many0_count, many1_count};
use nom::sequence::{delimited, pair, terminated};
use crate::text::parsers::{whitespace, WHITESPACE_CHARACTERS};
use crate::text::text_value::TextValue;
pub(crate) fn parse_blob(input: &str) -> IonParseResult<TextValue> {
let (remaining_input, base64_text) = delimited(
pair(tag("{{"), opt(whitespace)),
recognize(many0_count(terminated(
recognize_base64_data,
opt(whitespace),
))),
pair(opt(whitespace), tag("}}")),
)(input)?;
let decode_result = if base64_text.contains(WHITESPACE_CHARACTERS) {
let sanitized = base64_text.replace(WHITESPACE_CHARACTERS, "");
base64::decode(sanitized)
} else {
base64::decode(base64_text)
};
match decode_result {
Ok(data) => Ok((remaining_input, TextValue::Blob(data))),
Err(e) => fatal_parse_error(base64_text, format!("could not decode base64 data: {e}")),
}
}
fn recognize_base64_data(input: &str) -> IonParseResult<&str> {
recognize(many1_count(alt((alphanumeric1, is_a("+/=")))))(input).upgrade()
}
#[cfg(test)]
mod blob_parsing_tests {
use std::iter::FromIterator;
use crate::text::parsers::blob::parse_blob;
use crate::text::parsers::unit_test_support::{parse_test_err, parse_test_ok};
use crate::text::text_value::TextValue;
fn parse_equals<A: AsRef<[u8]>>(text: &str, expected: A) {
let data = Vec::from_iter(expected.as_ref().iter().copied());
parse_test_ok(parse_blob, text, TextValue::Blob(data))
}
fn parse_fails(text: &str) {
parse_test_err(parse_blob, text)
}
#[test]
fn test_parse_blobs() {
parse_equals("{{aGVsbG8h}} ", "hello!");
parse_equals(
"{{YnJldml0eSBpcyB0aGUgc291bCBvZiB3aXQ=}} ",
"brevity is the soul of wit",
);
parse_equals("{{Zm9vLCBiYXIsIGJheiwgcXV1eA==}} ", "foo, bar, baz, quux");
parse_equals("{{ aGVsbG8h}} ", "hello!");
parse_equals("{{aGVsbG8h }} ", "hello!");
parse_equals("{{ aGVsbG8h }} ", "hello!");
parse_fails("{ {Zm9vLCBiYXIsIGJheiwgcXV1eA==}} ");
parse_fails("{{Zm9vLCBiYXIsIGJheiwgcXV1eA==} } ");
parse_fails("{{Zm9vLCBiYXIsIGJheiwgcXV1eA===}} ");
parse_fails("{{Zm9vLC=BiYXIsIGJheiwgcXV1eA==}} ");
parse_fails("{{Zm9vLCBiYXIsI_GJheiwgcXV1eA==}} ");
}
}