aboutsummaryrefslogtreecommitdiffhomepage
path: root/doc_src/string.txt
blob: 2996b4565c348894dfaa53caea9b2486b56dd607 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
\section string string - manipulate strings

\subsection string-synopsis Synopsis
\fish{synopsis}
string length [(-q | --quiet)] [STRING...]
string sub [(-s | --start) START] [(-l | --length) LENGTH] [(-q | --quiet)]
           [STRING...]
string split [(-m | --max) MAX] [(-r | --right)] [(-q | --quiet)] SEP
             [STRING...]
string join [(-q | --quiet)] SEP [STRING...]
string trim [(-l | --left)] [(-r | --right)] [(-c | --chars) CHARS]
            [(-q | --quiet)] [STRING...]
string escape [(-n | --no-quoted)] [STRING...]
string match [(-a | --all)] [(-i | --ignore-case)] [(-r | --regex)]
             [(-n | --index)] [(-q | --quiet)] [(-v | --invert)] PATTERN [STRING...]
string replace [(-a | --all)] [(-i | --ignore-case)] [(-r | --regex)]
               [(-q | --quiet)] PATTERN REPLACEMENT [STRING...]
\endfish


\subsection string-description Description

`string` performs operations on strings.

STRING arguments are taken from the command line unless standard input is connected to a pipe or a file, in which case they are read from standard input, one STRING per line. It is an error to supply STRING arguments both on the command line and on standard input.

Arguments beginning with `-` are normally interpreted as switches; `--` causes the following arguments not to be treated as switches even if they begin with `-`. Switches and required arguments are recognized only on the command line.

Most subcommands accept a `-q` or `--quiet` switch, which suppresses the usual output but exits with the documented status.

In addition to the exit codes documented below, all the string subcommands exit with a value of 2 to indicate that an error occurred.

The following subcommands are available:

- `length` reports the length of each string argument in characters. Exit status: 0 if at least one non-empty STRING was given, or 1 otherwise.

- `sub` prints a substring of each string argument. The start of the substring can be specified with `-s` or `--start` followed by a 1-based index value. Positive index values are relative to the start of the string and negative index values are relative to the end of the string. The default start value is 1. The length of the substring can be specified with `-l` or `--length`. If the length is not specified, the substring continues to the end of each STRING. Exit status: 0 if at least one substring operation was performed, 1 otherwise.

- `split` splits each STRING on the separator SEP, which can be an empty string. If `-m` or `--max` is specified, at most MAX splits are done on each STRING. If `-r` or `--right` is given, splitting is performed right-to-left. This is useful in combination with `-m` or `--max`. Exit status: 0 if at least one split was performed, or 1 otherwise.

- `join` joins its STRING arguments into a single string separated by SEP, which can be an empty string. Exit status: 0 if at least one join was performed, or 1 otherwise.

- `trim` removes leading and trailing whitespace from each STRING. If `-l` or `--left` is given, only leading whitespace is removed. If `-r` or `--right` is given, only trailing whitespace is trimmed. The `-c` or `--chars` switch causes the characters in CHARS to be removed instead of whitespace. Exit status: 0 if at least one character was trimmed, or 1 otherwise.

- `escape` escapes each STRING such that it can be passed back to `eval` to produce the original argument again. By default, all special characters are escaped, and quotes are used to simplify the output when possible. If `-n` or `--no-quoted` is given, the simplifying quoted format is not used. Exit status: 0 if at least one string was escaped, or 1 otherwise.

- `match` tests each STRING against PATTERN and prints matching substrings. Only the first match for each STRING is reported unless `-a` or `--all` is given, in which case all matches are reported. Matching can be made case-insensitive with `-i` or `--ignore-case`. If `-n` or `--index` is given, each match is reported as a 1-based start position and a length. By default, PATTERN is interpreted as a glob pattern matched against each entire STRING argument. A glob pattern is only considered a valid match if it matches the entire STRING. If `-r` or `--regex` is given, PATTERN is interpreted as a Perl-compatible regular expression, which does not have to match the entire STRING. For a regular expression containing capturing groups, multiple items will be reported for each match, one for the entire match and one for each capturing group. If `-v` or `--invert` is used, the selected lines will be only those which do not match the given glob pattern or regular expression. Exit status: 0 if at least one match was found, or 1 otherwise.

- `replace` is similar to `match` but replaces non-overlapping matching substrings with a replacement string and prints the result. By default, PATTERN is treated as a literal substring to be matched. If `-r` or `--regex` is given, PATTERN is interpreted as a Perl-compatible regular expression, and REPLACEMENT can contain C-style escape sequences like `\t` as well as references to capturing groups by number or name as `$n` or `${n}`. Exit status: 0 if at least one replacement was performed, or 1 otherwise.

\subsection regular-expressions Regular Expressions

Both the `match` and `replace` subcommands support regular expressions when used with the `-r` or `--regex` option. The dialect is that of PCRE2.

In general, special characters are special by default, so `a+` matches one or more "a"s, while `a\+` matches an "a" and then a "+". `(a+)` matches one or more "a"s in a capturing group (`(?:XXXX)` denotes a non-capturing group). For the replacement parameter of `replace`, `$n` refers to the n-th group of the match. In the match parameter, `\n` (e.g. `\1`) refers back to groups.

\subsection string-example Examples

\fish{cli-dark}
>_ string length 'hello, world'
\outp{12}

>_ set str foo
>_ string length -q $str; echo $status
\outp{0}
# Equivalent to test -n $str
\endfish

\fish{cli-dark}
>_ string sub --length 2 abcde
\outp{ab}

>_ string sub -s 2 -l 2 abcde
\outp{bc}

>_ string sub --start=-2 abcde
\outp{de}
\endfish

\fish{cli-dark}
>_ string split . example.com
\outp{example}
\outp{com}

>_ string split -r -m1 / /usr/local/bin/fish
\outp{/usr/local/bin}
\outp{fish}

>_ string split '' abc
\outp{a}
\outp{b}
\outp{c}
\endfish

\fish{cli-dark}
>_ seq 3 | string join ...
\outp{1...2...3}
\endfish

\fish{cli-dark}
>_ string trim ' abc  '
\outp{abc}

>_ string trim --right --chars=yz xyzzy zany
\outp{x}
\outp{zan}
\endfish

\fish{cli-dark}
>_ echo \\x07 | string escape
\bksl{cg}
\endfish

\subsection string-example-match-glob Match Glob Examples

\fish{cli-dark}
>_ string match '?' a
\outp{a}

>_ string match 'a*b' axxb
\outp{axxb}

>_ string match -i 'a??B' Axxb
\outp{Axxb}

>_ echo 'ok?' | string match '*\\?'
\outp{ok?}
\endfish

\subsection string-example-match-regex Match Regex Examples

\fish{cli-dark}
>_ string match -r 'cat|dog|fish' 'nice dog'
\outp{dog}

>_ string match -r -v "c.*[12]" {cat,dog}(seq 1 4)
\outp{dog1}
\outp{dog2}
\outp{cat3}
\outp{dog3}
\outp{cat4}
\outp{dog4}
\endfish

\fish{cli-dark}
>_ string match -r '(\\d\\d?):(\\d\\d):(\\d\\d)' \asis{2:34:56}
\outp{2:34:56}
\outp{2}
\outp{34}
\outp{56}

>_ string match -r '^(\\w{{2,4}})\\g1$' papa mud murmur
\outp{papa}
\outp{pa}
\outp{murmur}
\outp{mur}

>_ string match -r -a -n at ratatat
\outp{2 2}
\outp{4 2}
\outp{6 2}

>_ string match -r -i '0x[0-9a-f]{{1,8}}' 'int magic = 0xBadC0de;'
\outp{0xBadC0de}
\endfish

\subsection string-example-replace-literal Replace Literal Examples

\fish{cli-dark}
>_ string replace is was 'blue is my favorite'
\outp{blue was my favorite}

>_ string replace 3rd last 1st 2nd 3rd
\outp{1st}
\outp{2nd}
\outp{last}

>_ string replace -a ' ' _ 'spaces to underscores'
\outp{spaces_to_underscores}
\endfish

\subsection string-example-replace-Regex Replace Regex Examples

\fish{cli-dark}
>_ string replace -r -a '[^\\d.]+' ' ' '0 one two 3.14 four 5x'
\outp{0 3.14 5}

>_ string replace -r '(\\w+)\\s+(\\w+)' '$2 $1 $$' 'left right'
\outp{right left $}

>_ string replace -r '\\s*newline\\s*' '\\n' 'put a newline here'
\outp{put a}
\outp{here}
\endfish