rust/src/string.rs

97 lines
3.0 KiB
Rust
Raw Normal View History

2015-06-23 13:58:58 +00:00
// Copyright 2015 The Rust Project Developers. See the COPYRIGHT
// file at the top-level directory of this distribution and at
// http://rust-lang.org/COPYRIGHT.
//
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
// option. This file may not be copied, modified, or distributed
// except according to those terms.
// Format string literals.
2015-09-04 03:38:12 +00:00
use unicode_segmentation::UnicodeSegmentation;
use regex::Regex;
use Indent;
use config::Config;
use utils::round_up_to_power_of_two;
2015-06-23 13:58:58 +00:00
use MIN_STRING;
pub struct StringFormat<'a> {
pub opener: &'a str,
pub closer: &'a str,
pub line_start: &'a str,
pub line_end: &'a str,
pub width: usize,
pub offset: Indent,
2015-06-23 13:58:58 +00:00
pub trim_end: bool,
pub config: &'a Config,
2015-06-23 13:58:58 +00:00
}
// TODO: simplify this!
pub fn rewrite_string<'a>(s: &str, fmt: &StringFormat<'a>) -> String {
// TODO if lo.col > IDEAL - 10, start a new line (need cur indent for that)
2015-09-04 03:38:12 +00:00
// Strip line breaks.
let re = Regex::new(r"(\\[:space:]+)").unwrap();
let stripped_str = re.replace_all(s, "");
let graphemes = UnicodeSegmentation::graphemes(&*stripped_str, false).collect::<Vec<&str>>();
2015-06-23 13:58:58 +00:00
let indent = fmt.offset.to_string(fmt.config);
2015-06-23 13:58:58 +00:00
let indent = &indent;
let mut cur_start = 0;
let mut result = String::with_capacity(round_up_to_power_of_two(s.len()));
result.push_str(fmt.opener);
let ender_length = fmt.line_end.len();
2015-09-10 22:52:16 +00:00
let max_chars = fmt.width.checked_sub(fmt.opener.len() + ender_length).unwrap_or(1);
2015-06-23 13:58:58 +00:00
loop {
let mut cur_end = cur_start + max_chars;
2015-09-04 03:38:12 +00:00
if cur_end >= graphemes.len() {
let line = &graphemes[cur_start..].join("");
result.push_str(line);
2015-06-23 13:58:58 +00:00
break;
}
// Push cur_end left until we reach whitespace.
2015-09-04 03:38:12 +00:00
while !(graphemes[cur_end - 1].trim().len() == 0) {
cur_end -= 1;
2015-06-23 13:58:58 +00:00
if cur_end - cur_start < MIN_STRING {
// We can't break at whitespace, fall back to splitting
// anywhere that doesn't break an escape sequence.
2015-09-04 03:38:12 +00:00
cur_end = cur_start + max_chars;
while graphemes[cur_end - 1] == "\\" {
cur_end -= 1;
2015-06-23 13:58:58 +00:00
}
break;
}
}
// Make sure there is no whitespace to the right of the break.
2015-09-04 03:38:12 +00:00
while cur_end < s.len() && graphemes[cur_end].trim().len() == 0 {
cur_end += 1;
2015-06-23 13:58:58 +00:00
}
2015-09-04 03:38:12 +00:00
let raw_line = graphemes[cur_start..cur_end].join("");
2015-09-09 11:56:56 +00:00
let line = if fmt.trim_end {
raw_line.trim()
2015-06-23 13:58:58 +00:00
} else {
2015-09-09 11:56:56 +00:00
// TODO: use as_str once it's stable.
&*raw_line
2015-06-23 13:58:58 +00:00
};
result.push_str(line);
result.push_str(fmt.line_end);
result.push('\n');
result.push_str(indent);
result.push_str(fmt.line_start);
cur_start = cur_end;
}
result.push_str(fmt.closer);
result
}