v/vlib/strings/strings.v

module strings

// import rand
// random returns a random string with `n` characters
/*
pub fn random(n int) string {
	buf := vmalloc(n)
	for i in 0..n {
		buf[i] = rand.next()
	}
	return tos(buf)
}
*/

// find_between_pair_u8 returns the part of `input` enclosed by the first
// *outermost* pair of `start` and `end` byte marks.
// Unlike the `find_between`, `all_after*` and `all_before*` methods of the `string`
// type, nesting is tracked: every `start` byte opens a level, every `end` byte seen
// after the first `start` closes one, and the text between the first `start` and the
// `end` that closes the last open level is returned (inner marks are kept verbatim).
// An empty string is returned when `input` has no `start` mark, or when the opened
// levels are never all closed.
// `start` and `end` must differ: a byte equal to both is always counted as `start`,
// so nothing is ever closed.
// The scan works directly on the bytes of `input`, without building a rune array.
// Example: assert strings.find_between_pair_u8('(V) (NOT V)',`(`,`)`) == 'V'
// Example: assert strings.find_between_pair_u8('s {X{Y}} s',`{`,`}`) == 'X{Y}'
pub fn find_between_pair_u8(input string, start u8, end u8) string {
	mut depth := 0
	mut content_begin := -1
	for pos, ch in input {
		if ch == start {
			depth++
			// Only the very first `start` fixes where the result begins.
			if content_begin == -1 {
				content_begin = pos + 1
			}
			continue
		}
		// `end` bytes are ignored until a `start` has been seen.
		if content_begin <= 0 || ch != end {
			continue
		}
		depth--
		if depth == 0 {
			return input[content_begin..pos]
		}
	}
	return ''
}

// find_between_pair_rune returns the part of `input` enclosed by the first
// *outermost* pair of `start` and `end` rune marks.
// Unlike the `find_between`, `all_after*` and `all_before*` methods of the `string`
// type, nesting is tracked: every `start` rune opens a level, every `end` rune seen
// after the first `start` closes one, and the text between the first `start` and the
// `end` that closes the last open level is returned (inner marks are kept verbatim).
// An empty string is returned when `input` has no `start` mark, or when the opened
// levels are never all closed.
// `start` and `end` must differ: a rune equal to both is always counted as `start`,
// so nothing is ever closed.
// `input` is first decoded with `runes()`, so marks may be multi-byte characters;
// when both marks are single bytes, find_between_pair_u8 avoids that conversion.
// Example: assert strings.find_between_pair_rune('(V) (NOT V)',`(`,`)`) == 'V'
// Example: assert strings.find_between_pair_rune('s {X{Y}} s',`{`,`}`) == 'X{Y}'
pub fn find_between_pair_rune(input string, start rune, end rune) string {
	chars := input.runes()
	mut depth := 0
	mut content_begin := -1
	for pos := 0; pos < chars.len; pos++ {
		ch := chars[pos]
		if ch == start {
			depth++
			// Only the very first `start` fixes where the result begins.
			if content_begin == -1 {
				content_begin = pos + 1
			}
			continue
		}
		// `end` runes are ignored until a `start` has been seen.
		if content_begin <= 0 || ch != end {
			continue
		}
		depth--
		if depth == 0 {
			return chars[content_begin..pos].string()
		}
	}
	return ''
}

// find_between_pair_string returns the part of `input` enclosed by the first
// *outermost* pair of `start` and `end` string marks.
// Unlike the `find_between`, `all_after*` and `all_before*` methods of the `string`
// type, nesting is tracked: every `start` mark opens a level, every `end` mark seen
// after the first `start` closes one, and the text between the first `start` and the
// `end` that closes the last open level is returned (inner marks are kept verbatim).
// An empty string is returned when `input` has no `start` mark, when the opened
// levels are never all closed, or when `start` or `end` is itself empty.
// Using two identical marks as `start` and `end` is not supported.
// `input` and both marks are decoded with `runes()` and compared slice by slice at
// every position, which makes this the most expensive of the find_between_pair_*
// functions.
// Example: assert strings.find_between_pair_string('/*V*/ /*NOT V*/','/*','*/') == 'V'
// Example: assert strings.find_between_pair_string('s {{X{{Y}}}} s','{{','}}') == 'X{{Y}}'
pub fn find_between_pair_string(input string, start string, end string) string {
	// An empty mark cannot delimit anything. Without this guard an empty `start`
	// matches at every position and rewinds `i` by one each time, so the loop
	// below would never terminate.
	if start.len == 0 || end.len == 0 {
		return ''
	}
	mut start_index := -1
	mut marks := 0
	start_runes := start.runes()
	end_runes := end.runes()
	runes := input.runes()
	mut i := 0
	for ; i < runes.len; i++ {
		// `#[..]` is the gated slice: it clamps instead of panicking near the end of `runes`.
		start_slice := runes#[i..i + start_runes.len]
		if start_slice == start_runes {
			// Jump to the last rune of the mark; the loop's `i++` moves past it.
			i = i + start_runes.len - 1
			if start_index < 0 {
				// Content begins right after the first `start` mark.
				start_index = i + 1
			}
			marks++
			continue
		}
		// `end` marks are ignored until a `start` has been seen.
		if start_index > 0 {
			end_slice := runes#[i..i + end_runes.len]
			if end_slice == end_runes {
				marks--
				if marks == 0 {
					return runes[start_index..i].string()
				}
				// Skip the rest of this inner `end` mark.
				i = i + end_runes.len - 1
				continue
			}
		}
	}
	return ''
}

// split_capital returns the pieces of `s` obtained by starting a new piece at every
// capital letter. Only the ASCII letters `A`..`Z` count as capitals.
// Each capital stays at the front of its piece; text before the first capital, if any,
// becomes the first piece. An empty `s` yields an empty array.
// Example: assert strings.split_capital('XYZ') == ['X', 'Y', 'Z']
// Example: assert strings.split_capital('XYStar') == ['X', 'Y', 'Star']
pub fn split_capital(s string) []string {
	mut parts := []string{}
	mut begin := 0
	for pos, ch in s {
		// Anything that is not an ASCII capital just extends the current piece.
		if ch < `A` || ch > `Z` {
			continue
		}
		// Close the piece collected so far (none when the capital is the first byte).
		if begin != pos {
			parts << s#[begin..pos]
		}
		begin = pos
	}
	// Flush the last piece, which runs to the end of `s`.
	if begin != s.len {
		parts << s#[begin..]
	}
	return parts
}
vweb: fix duplicate fn error with multiple templates 2020-06-09 12:43:16 +02:00			`module strings`

strings: run v fmt (#7438) 2020-12-21 21:00:32 +01:00			`// import rand`
vweb: fix duplicate fn error with multiple templates 2020-06-09 12:43:16 +02:00			// random returns a random string with `n` characters
			`/*`
			`pub fn random(n int) string {`
			`buf := vmalloc(n)`
			`for i in 0..n {`
			`buf[i] = rand.next()`
			`}`
			`return tos(buf)`
			`}`
			`*/`
strings: add find_between_pair (#13468) 2022-02-15 14:12:15 +01:00
			`// find_between_pair_byte returns the string found between the pair of marks defined`
			// by `start` and `end`.
			// As opposed to the `find_between`, `all_after`, `all_before` methods defined on the
			// `string` type, this function can extract content between nested marks in `input`.
			// If `start` and `end` marks are nested in `input`, the characters
			// between the outermost mark pair is returned. It is expected that `start` and `end`
			// marks are balanced, meaning that the amount of `start` marks equal the
			// amount of `end` marks in the `input`. An empty string is returned otherwise.
			// Using two identical marks as `start` and `end` results in undefined output behavior.
			`// find_between_pair_byte is the fastest in the find_between_pair_* family of functions.`
all: byte => u8 2022-04-15 13:58:56 +02:00			// Example: assert strings.find_between_pair_u8('(V) (NOT V)',`(`,`)`) == 'V'
			// Example: assert strings.find_between_pair_u8('s {X{Y}} s',`{`,`}`) == 'X{Y}'
all: ~500 more byte=>u8 2022-04-15 17:25:45 +02:00			`pub fn find_between_pair_u8(input string, start u8, end u8) string {`
strings: add find_between_pair (#13468) 2022-02-15 14:12:15 +01:00			`mut marks := 0`
			`mut start_index := -1`
			`for i, b in input {`
			`if b == start {`
			`if start_index == -1 {`
			`start_index = i + 1`
			`}`
			`marks++`
			`continue`
			`}`
			`if start_index > 0 {`
			`if b == end {`
			`marks--`
			`if marks == 0 {`
			`return input[start_index..i]`
			`}`
			`}`
			`}`
			`}`
			`return ''`
			`}`

			`// find_between_pair_rune returns the string found between the pair of marks defined`
			// by `start` and `end`.
			// As opposed to the `find_between`, `all_after`, `all_before` methods defined on the
			// `string` type, this function can extract content between nested marks in `input`.
			// If `start` and `end` marks are nested in `input`, the characters
			// between the outermost mark pair is returned. It is expected that `start` and `end`
			// marks are balanced, meaning that the amount of `start` marks equal the
			// amount of `end` marks in the `input`. An empty string is returned otherwise.
			// Using two identical marks as `start` and `end` results in undefined output behavior.
			`// find_between_pair_rune is inbetween the fastest and slowest in the find_between_pair_* family of functions.`
			// Example: assert strings.find_between_pair_rune('(V) (NOT V)',`(`,`)`) == 'V'
			// Example: assert strings.find_between_pair_rune('s {X{Y}} s',`{`,`}`) == 'X{Y}'
			`pub fn find_between_pair_rune(input string, start rune, end rune) string {`
			`mut marks := 0`
			`mut start_index := -1`
			`runes := input.runes()`
			`for i, r in runes {`
			`if r == start {`
			`if start_index == -1 {`
			`start_index = i + 1`
			`}`
			`marks++`
			`continue`
			`}`
			`if start_index > 0 {`
			`if r == end {`
			`marks--`
			`if marks == 0 {`
			`return runes[start_index..i].string()`
			`}`
			`}`
			`}`
			`}`
			`return ''`
			`}`

			`// find_between_pair_string returns the string found between the pair of marks defined`
			// by `start` and `end`.
			// As opposed to the `find_between`, `all_after`, `all_before` methods defined on the
			// `string` type, this function can extract content between nested marks in `input`.
			// If `start` and `end` marks are nested in `input`, the characters
			// between the outermost mark pair is returned. It is expected that `start` and `end`
			// marks are balanced, meaning that the amount of `start` marks equal the
			// amount of `end` marks in the `input`. An empty string is returned otherwise.
			// Using two identical marks as `start` and `end` results in undefined output behavior.
			`// find_between_pair_string is the slowest in the find_between_pair_* function family.`
			`// Example: assert strings.find_between_pair_string('/V/ /NOT V/','/','/') == 'V'`
			`// Example: assert strings.find_between_pair_string('s {{X{{Y}}}} s','{{','}}') == 'X{{Y}}'`
			`pub fn find_between_pair_string(input string, start string, end string) string {`
			`mut start_index := -1`
			`mut marks := 0`
			`start_runes := start.runes()`
			`end_runes := end.runes()`
			`runes := input.runes()`
			`mut i := 0`
			`for ; i < runes.len; i++ {`
			`start_slice := runes#[i..i + start_runes.len]`
			`if start_slice == start_runes {`
			`i = i + start_runes.len - 1`
			`if start_index < 0 {`
			`start_index = i + 1`
			`}`
			`marks++`
			`continue`
			`}`
			`if start_index > 0 {`
			`end_slice := runes#[i..i + end_runes.len]`
			`if end_slice == end_runes {`
			`marks--`
			`if marks == 0 {`
			`return runes[start_index..i].string()`
			`}`
			`i = i + end_runes.len - 1`
			`continue`
			`}`
			`}`
			`}`
			`return ''`
			`}`
strings: add split_capital (#14716) 2022-06-07 17:43:06 +02:00
			// split_capital returns an array containing the contents of `s` split by capital letters.
			`// Example: assert strings.split_capital('XYZ') == ['X', 'Y', 'Z']`
			`// Example: assert strings.split_capital('XYStar') == ['X', 'Y', 'Star']`
			`pub fn split_capital(s string) []string {`
			`mut res := []string{}`
			`mut word_start := 0`
			`for idx, c in s {`
			if c >= `A` && c <= `Z` {
			`if word_start != idx {`
			`res << s#[word_start..idx]`
			`}`
			`word_start = idx`
			`continue`
			`}`
			`}`
			`if word_start != s.len {`
			`res << s#[word_start..]`
			`}`
			`return res`
			`}`