Merge pull request #4 from Kryptos-FR/buffered

Refactor using a buffer for reading and a buffer for writing
This commit is contained in:
nora 2021-09-04 17:07:16 +02:00 committed by GitHub
commit 69832423b4
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
3 changed files with 90 additions and 46 deletions

2
Cargo.lock generated
View file

@ -1,5 +1,7 @@
# This file is automatically @generated by Cargo. # This file is automatically @generated by Cargo.
# It is not intended for manual editing. # It is not intended for manual editing.
version = 3
[[package]] [[package]]
name = "ansi_term" name = "ansi_term"
version = "0.11.0" version = "0.11.0"

View file

@ -3,6 +3,9 @@
//! //!
//! It does not do anything more than that, which makes it so fast. //! It does not do anything more than that, which makes it so fast.
use std::error::Error;
use std::io::{BufReader, BufWriter, Read, Write};
/// ///
/// Set the indentation used for the formatting. /// Set the indentation used for the formatting.
/// ///
@ -24,32 +27,52 @@ pub enum Indentation<'a> {
/// The default indentation is faster than a custom one /// The default indentation is faster than a custom one
/// ///
pub fn format_json(json: &str, indentation: Indentation) -> String { pub fn format_json(json: &str, indentation: Indentation) -> String {
// at least as big as the input to avoid resizing let mut reader = BufReader::new(json.as_bytes());
// this might be too big if the input string is formatted in a weird way, but that's not expected, and it will still be efficient let mut writer = BufWriter::new(Vec::new());
let mut out = String::with_capacity(json.len());
format_json_buffered(&mut reader, &mut writer, indentation).unwrap();
String::from_utf8(writer.into_inner().unwrap()).unwrap()
}
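///
/// # Formats json read from a reader and writes the result to a writer
///
/// The indentation can be set to any value using [Indentation](jsonformat::Indentation)
/// The default value is two spaces
/// The default indentation is faster than a custom one
///
/// Returns an error if reading from the reader or writing to the writer fails
///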
pub fn format_json_buffered<R, W>(
reader: &mut BufReader<R>,
writer: &mut BufWriter<W>,
indentation: Indentation,
) -> Result<(), Box<dyn Error>>
where
R: Read,
W: Write,
{
let mut escaped = false; let mut escaped = false;
let mut in_string = false; let mut in_string = false;
let mut indent_level = 0usize; let mut indent_level = 0usize;
let mut newline_requested = false; // invalidated if next character is ] or } let mut newline_requested = false; // invalidated if next character is ] or }
for char in json.chars() { for char in reader.bytes() {
let char = char?;
if in_string { if in_string {
let mut escape_here = false; let mut escape_here = false;
match char { match char {
'"' => { b'"' => {
if !escaped { if !escaped {
in_string = false; in_string = false;
} }
} }
'\\' => { b'\\' => {
if !escaped { if !escaped {
escape_here = true; escape_here = true;
} }
} }
_ => {} _ => {}
} }
out.push(char); writer.write_all(&[char])?;
escaped = escape_here; escaped = escape_here;
} else { } else {
let mut auto_push = true; let mut auto_push = true;
@ -57,65 +80,73 @@ pub fn format_json(json: &str, indentation: Indentation) -> String {
let old_level = indent_level; let old_level = indent_level;
match char { match char {
'"' => in_string = true, b'"' => in_string = true,
' ' | '\n' | '\t' => continue, b' ' | b'\n' | b'\t' => continue,
'[' => { b'[' => {
indent_level += 1; indent_level += 1;
request_newline = true; request_newline = true;
} }
'{' => { b'{' => {
indent_level += 1; indent_level += 1;
request_newline = true; request_newline = true;
} }
'}' | ']' => { b'}' | b']' => {
indent_level = indent_level.saturating_sub(1); indent_level = indent_level.saturating_sub(1);
if !newline_requested { if !newline_requested {
// see comment below about newline_requested // see comment below about newline_requested
out.push('\n'); writer.write_all(&[b'\n'])?;
indent(&mut out, indent_level, indentation); indent_buffered(writer, indent_level, indentation)?;
} }
} }
':' => { b':' => {
auto_push = false; auto_push = false;
out.push(char); writer.write_all(&[char])?;
out.push(' '); writer.write_all(&[b' '])?;
} }
',' => { b',' => {
request_newline = true; request_newline = true;
} }
_ => {} _ => {}
} }
if newline_requested && char != ']' && char != '}' { if newline_requested && char != b']' && char != b'}' {
// newline only happens after { [ and , // newline only happens after { [ and ,
// this means we can safely assume that it being followed up by } or ] // this means we can safely assume that it being followed up by } or ]
// means an empty object/array // means an empty object/array
out.push('\n'); writer.write_all(&[b'\n'])?;
indent(&mut out, old_level, indentation); indent_buffered(writer, old_level, indentation)?;
} }
if auto_push { if auto_push {
out.push(char); writer.write_all(&[char])?;
} }
newline_requested = request_newline; newline_requested = request_newline;
} }
} }
out Ok(())
} }
fn indent(buf: &mut String, level: usize, indent_str: Indentation) { fn indent_buffered<W>(
writer: &mut BufWriter<W>,
level: usize,
indent_str: Indentation,
) -> Result<(), Box<dyn Error>>
where
W: std::io::Write,
{
for _ in 0..level { for _ in 0..level {
match indent_str { match indent_str {
Indentation::Default => { Indentation::Default => {
buf.push(' '); writer.write_all(b" ")?;
buf.push(' ');
} }
Indentation::Custom(indent) => { Indentation::Custom(indent) => {
buf.push_str(indent); writer.write_all(indent.as_bytes())?;
} }
} }
} }
Ok(())
} }
#[cfg(test)] #[cfg(test)]

View file

@ -1,10 +1,10 @@
use clap::clap_app; use clap::clap_app;
use jsonformat::{format_json, Indentation}; use jsonformat::{format_json_buffered, Indentation};
use std::fs; use std::error::Error;
use std::io; use std::fs::File;
use std::io::Read; use std::io::{BufReader, BufWriter, Read, Write};
fn main() -> Result<(), io::Error> { fn main() -> Result<(), Box<dyn Error>> {
let matches = clap_app!(jsonformat => let matches = clap_app!(jsonformat =>
(version: "1.1") (version: "1.1")
(author: "nilstrieb <nilstrieb@gmail.com>") (author: "nilstrieb <nilstrieb@gmail.com>")
@ -16,13 +16,16 @@ fn main() -> Result<(), io::Error> {
) )
.get_matches(); .get_matches();
let str = match matches.value_of("input") { // Note: on-stack dynamic dispatch
Some(path) => fs::read_to_string(path)?, let (mut file, mut stdin);
let reader: &mut dyn Read = match matches.value_of("input") {
Some(path) => {
file = File::open(path)?;
&mut file
}
None => { None => {
let mut buf = String::new(); stdin = std::io::stdin();
let stdin = std::io::stdin(); &mut stdin
stdin.lock().read_to_string(&mut buf)?;
buf
} }
}; };
@ -41,8 +44,6 @@ fn main() -> Result<(), io::Error> {
None => Indentation::Default, None => Indentation::Default,
}; };
let formatted = format_json(&str, indent);
let mut output = matches.value_of("output"); let mut output = matches.value_of("output");
let mut windows_output_default_file: Option<String> = None; let mut windows_output_default_file: Option<String> = None;
@ -57,12 +58,22 @@ fn main() -> Result<(), io::Error> {
output = windows_output_default_file.as_deref().or(output); output = windows_output_default_file.as_deref().or(output);
match output { // Note: on-stack dynamic dispatch
Some(file) => { let (mut file, mut stdout);
fs::write(file, formatted)?; let writer: &mut dyn Write = match output {
} Some(filename) => {
None => println!("{}", formatted), file = File::create(filename)?;
} &mut file
},
None => {
stdout = std::io::stdout();
&mut stdout
},
};
let mut reader = BufReader::new(reader);
let mut writer = BufWriter::new(writer);
format_json_buffered(&mut reader, &mut writer, indent)?;
Ok(()) Ok(())
} }