Created
April 22, 2020 22:08
-
-
Save jonhoo/2a7fdcf79be03e51a5f95cd326f2a1e8 to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#![warn(rust_2018_idioms)] | |
#[derive(Debug)] | |
pub struct StrSplit<'haystack, D> { | |
remainder: Option<&'haystack str>, | |
delimiter: D, | |
} | |
impl<'haystack, D> StrSplit<'haystack, D> { | |
pub fn new(haystack: &'haystack str, delimiter: D) -> Self { | |
Self { | |
remainder: Some(haystack), | |
delimiter, | |
} | |
} | |
} | |
pub trait Delimiter { | |
fn find_next(&self, s: &str) -> Option<(usize, usize)>; | |
} | |
impl<'haystack, D> Iterator for StrSplit<'haystack, D> | |
where | |
D: Delimiter, | |
{ | |
type Item = &'haystack str; | |
fn next(&mut self) -> Option<Self::Item> { | |
let remainder = self.remainder.as_mut()?; | |
if let Some((delim_start, delim_end)) = self.delimiter.find_next(remainder) { | |
let until_delimiter = &remainder[..delim_start]; | |
*remainder = &remainder[delim_end..]; | |
Some(until_delimiter) | |
} else { | |
self.remainder.take() | |
} | |
} | |
} | |
impl Delimiter for &str { | |
fn find_next(&self, s: &str) -> Option<(usize, usize)> { | |
s.find(self).map(|start| (start, start + self.len())) | |
} | |
} | |
impl Delimiter for char { | |
fn find_next(&self, s: &str) -> Option<(usize, usize)> { | |
s.char_indices() | |
.find(|(_, c)| c == self) | |
.map(|(start, _)| (start, start + self.len_utf8())) | |
} | |
} | |
pub fn until_char(s: &str, c: char) -> &'_ str { | |
StrSplit::new(s, c) | |
.next() | |
.expect("StrSplit always gives at least one result") | |
} | |
#[test] | |
fn until_char_test() { | |
assert_eq!(until_char("hello world", 'o'), "hell"); | |
} | |
#[test] | |
fn it_works() { | |
let haystack = "a b c d e"; | |
let letters: Vec<_> = StrSplit::new(haystack, " ").collect(); | |
assert_eq!(letters, vec!["a", "b", "c", "d", "e"]); | |
} | |
#[test] | |
fn tail() { | |
let haystack = "a b c d "; | |
let letters: Vec<_> = StrSplit::new(haystack, " ").collect(); | |
assert_eq!(letters, vec!["a", "b", "c", "d", ""]); | |
} |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment
Something that might be worth noting here is that if the delimiter has length 0 (for example, an empty string), this will infinitely loop!
It will keep returning empty strings since the
remainder
never actually gets smaller in that case.I'm not actually sure how that should be handled though, as it looks like
""
patterns have non-standard behavior in the standard library: https://doc.rust-lang.org/std/primitive.str.html#impl-Pattern-for-%26strFor example:
Playground link: https://play.rust-lang.org/?version=stable&mode=debug&edition=2024&gist=5d009e96309f4f631bde4589d06f7cde
I don't think there is a trivially easy way to change the code in this gist to handle this off the top of my head, so I'll just leave this here for anyone curious!