David Tolnay | 14cbdeb | 2016-10-01 12:13:59 -0700 | [diff] [blame] | 1 | use nom::IResult; |
| 2 | use unicode_xid::UnicodeXID; |
| 3 | |
| 4 | pub fn whitespace(input: &str) -> IResult<&str, ()> { |
| 5 | if input.is_empty() { |
| 6 | return IResult::Error; |
| 7 | } |
| 8 | |
David Tolnay | 318195d | 2016-10-08 11:34:19 -0700 | [diff] [blame] | 9 | let bytes = input.as_bytes(); |
| 10 | let mut i = 0; |
| 11 | while i < bytes.len() { |
| 12 | let s = &input[i..]; |
| 13 | if bytes[i] == b'/' { |
David Tolnay | daaf774 | 2016-10-03 11:11:43 -0700 | [diff] [blame] | 14 | if s.starts_with("//") && (!s.starts_with("///") || s.starts_with("////")) && |
| 15 | !s.starts_with("//!") { |
David Tolnay | 14cbdeb | 2016-10-01 12:13:59 -0700 | [diff] [blame] | 16 | if let Some(len) = s.find('\n') { |
David Tolnay | 318195d | 2016-10-08 11:34:19 -0700 | [diff] [blame] | 17 | i += len + 1; |
David Tolnay | 14cbdeb | 2016-10-01 12:13:59 -0700 | [diff] [blame] | 18 | continue; |
| 19 | } |
| 20 | break; |
David Tolnay | daaf774 | 2016-10-03 11:11:43 -0700 | [diff] [blame] | 21 | } else if s.starts_with("/*") && !s.starts_with("/**") && !s.starts_with("/*!") { |
David Tolnay | 14cbdeb | 2016-10-01 12:13:59 -0700 | [diff] [blame] | 22 | match block_comment(s) { |
| 23 | IResult::Done(_, com) => { |
David Tolnay | 318195d | 2016-10-08 11:34:19 -0700 | [diff] [blame] | 24 | i += com.len(); |
David Tolnay | 14cbdeb | 2016-10-01 12:13:59 -0700 | [diff] [blame] | 25 | continue; |
| 26 | } |
| 27 | IResult::Error => { |
| 28 | return IResult::Error; |
| 29 | } |
| 30 | } |
| 31 | } |
| 32 | } |
David Tolnay | 318195d | 2016-10-08 11:34:19 -0700 | [diff] [blame] | 33 | match bytes[i] { |
| 34 | b' ' | 0x09...0x0d => { |
| 35 | i += 1; |
| 36 | continue; |
| 37 | } |
David Tolnay | 3bcfb72 | 2016-10-08 11:58:36 -0700 | [diff] [blame^] | 38 | b if b <= 0x7f => {} |
David Tolnay | 318195d | 2016-10-08 11:34:19 -0700 | [diff] [blame] | 39 | _ => { |
| 40 | let ch = s.chars().next().unwrap(); |
| 41 | if ch.is_whitespace() { |
| 42 | i += ch.len_utf8(); |
| 43 | continue; |
| 44 | } |
| 45 | } |
David Tolnay | 14cbdeb | 2016-10-01 12:13:59 -0700 | [diff] [blame] | 46 | } |
David Tolnay | 318195d | 2016-10-08 11:34:19 -0700 | [diff] [blame] | 47 | return if i > 0 { |
| 48 | IResult::Done(s, ()) |
| 49 | } else { |
| 50 | IResult::Error |
| 51 | }; |
David Tolnay | 14cbdeb | 2016-10-01 12:13:59 -0700 | [diff] [blame] | 52 | } |
| 53 | IResult::Done("", ()) |
| 54 | } |
| 55 | |
| 56 | pub fn block_comment(input: &str) -> IResult<&str, &str> { |
| 57 | if !input.starts_with("/*") { |
| 58 | return IResult::Error; |
| 59 | } |
| 60 | |
| 61 | let mut depth = 0; |
David Tolnay | 079b5ad | 2016-10-08 09:39:29 -0700 | [diff] [blame] | 62 | let bytes = input.as_bytes(); |
| 63 | let mut i = 0; |
| 64 | let upper = bytes.len() - 1; |
| 65 | while i < upper { |
| 66 | if bytes[i] == b'/' && bytes[i + 1] == b'*' { |
David Tolnay | 14cbdeb | 2016-10-01 12:13:59 -0700 | [diff] [blame] | 67 | depth += 1; |
David Tolnay | 079b5ad | 2016-10-08 09:39:29 -0700 | [diff] [blame] | 68 | i += 1; // eat '*' |
| 69 | } else if bytes[i] == b'*' && bytes[i + 1] == b'/' { |
David Tolnay | 14cbdeb | 2016-10-01 12:13:59 -0700 | [diff] [blame] | 70 | depth -= 1; |
| 71 | if depth == 0 { |
| 72 | return IResult::Done(&input[i + 2..], &input[..i + 2]); |
| 73 | } |
David Tolnay | 079b5ad | 2016-10-08 09:39:29 -0700 | [diff] [blame] | 74 | i += 1; // eat '/' |
David Tolnay | 14cbdeb | 2016-10-01 12:13:59 -0700 | [diff] [blame] | 75 | } |
David Tolnay | 079b5ad | 2016-10-08 09:39:29 -0700 | [diff] [blame] | 76 | i += 1; |
David Tolnay | 14cbdeb | 2016-10-01 12:13:59 -0700 | [diff] [blame] | 77 | } |
| 78 | IResult::Error |
| 79 | } |
| 80 | |
| 81 | pub fn word_break(input: &str) -> IResult<&str, ()> { |
| 82 | match input.chars().next() { |
David Tolnay | daaf774 | 2016-10-03 11:11:43 -0700 | [diff] [blame] | 83 | Some(ch) if UnicodeXID::is_xid_continue(ch) => IResult::Error, |
| 84 | Some(_) | None => IResult::Done(input, ()), |
David Tolnay | 14cbdeb | 2016-10-01 12:13:59 -0700 | [diff] [blame] | 85 | } |
| 86 | } |