1
2
3
4
5
6
7
8
9
10
11
12#include "libbb.h"
13
14
15
16
17
18static const char optstring[] ALIGN1 = "b:c:f:d:sn";
19#define CUT_OPT_BYTE_FLGS (1 << 0)
20#define CUT_OPT_CHAR_FLGS (1 << 1)
21#define CUT_OPT_FIELDS_FLGS (1 << 2)
22#define CUT_OPT_DELIM_FLGS (1 << 3)
23#define CUT_OPT_SUPPRESS_FLGS (1 << 4)
24
/*
 * One element of the user-supplied position list.
 * startpos is the first selected position; endpos is the last selected
 * position, or NON_RANGE when the element names a single position.
 */
struct cut_list {
	int startpos;
	int endpos;
};

/* Sentinel values stored in struct cut_list. */
enum {
	BOL = 0,          /* start position used when the range has no lower bound */
	EOL = INT_MAX,    /* end position used when the range has no upper bound */
	NON_RANGE = -1    /* endpos marker: element is a single position, not a range */
};

/*
 * qsort() comparator: orders cut_list elements by ascending startpos.
 *
 * Returns a negative, zero or positive value when a sorts before, equal
 * to, or after b.  The result is computed by comparison rather than by
 * subtraction so that it cannot overflow, and the arguments are accessed
 * through const pointers so the qualifier qsort() passes in is preserved.
 */
static int cmpfunc(const void *a, const void *b)
{
	const struct cut_list *lhs = a;
	const struct cut_list *rhs = b;

	return (lhs->startpos > rhs->startpos) - (lhs->startpos < rhs->startpos);
}
42
43static void cut_file(FILE *file, char delim, const struct cut_list *cut_lists, unsigned nlists)
44{
45 char *line;
46 unsigned linenum = 0;
47
48
49 while ((line = xmalloc_fgetline(file)) != NULL) {
50
51
52 int linelen = strlen(line);
53 char *printed = xzalloc(linelen + 1);
54 char *orig_line = line;
55 unsigned cl_pos = 0;
56 int spos;
57
58
59 if (option_mask32 & (CUT_OPT_CHAR_FLGS | CUT_OPT_BYTE_FLGS)) {
60
61 for (; cl_pos < nlists; cl_pos++) {
62 spos = cut_lists[cl_pos].startpos;
63 while (spos < linelen) {
64 if (!printed[spos]) {
65 printed[spos] = 'X';
66 putchar(line[spos]);
67 }
68 spos++;
69 if (spos > cut_lists[cl_pos].endpos
70
71
72
73 ) {
74 break;
75 }
76 }
77 }
78 } else if (delim == '\n') {
79 spos = cut_lists[cl_pos].startpos;
80
81
82
83 if (((int)linenum < spos) || (cl_pos >= nlists))
84 goto next_line;
85
86
87
88 while (spos < (int)linenum) {
89 spos++;
90
91 if (spos > cut_lists[cl_pos].endpos
92 || cut_lists[cl_pos].endpos == NON_RANGE
93 ) {
94 cl_pos++;
95
96 if (cl_pos >= nlists)
97 goto next_line;
98 spos = cut_lists[cl_pos].startpos;
99
100
101 if ((int)linenum < spos)
102 goto next_line;
103 }
104 }
105
106
107
108 puts(line);
109 goto next_line;
110 } else {
111 int ndelim = -1;
112 int nfields_printed = 0;
113 char *field = NULL;
114 const char delimiter[2] = { delim, 0 };
115
116
117 if (strchr(line, delim) == NULL) {
118 if (!(option_mask32 & CUT_OPT_SUPPRESS_FLGS))
119 puts(line);
120 goto next_line;
121 }
122
123
124
125 for (; cl_pos < nlists && line; cl_pos++) {
126 spos = cut_lists[cl_pos].startpos;
127 do {
128
129 while (line && ndelim < spos) {
130 field = strsep(&line, delimiter);
131 ndelim++;
132 }
133
134
135 if (field && ndelim == spos && !printed[ndelim]) {
136
137
138
139 if (nfields_printed > 0)
140 putchar(delim);
141 fputs(field, stdout);
142 printed[ndelim] = 'X';
143 nfields_printed++;
144 }
145
146 spos++;
147
148
149
150
151 } while (spos <= cut_lists[cl_pos].endpos && line
152 && cut_lists[cl_pos].endpos != NON_RANGE);
153 }
154 }
155
156
157 putchar('\n');
158 next_line:
159 linenum++;
160 free(printed);
161 free(orig_line);
162 }
163}
164
165int cut_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE;
166int cut_main(int argc UNUSED_PARAM, char **argv)
167{
168
169 struct cut_list *cut_lists = NULL;
170 unsigned nlists = 0;
171 char delim = '\t';
172 char *sopt, *ltok;
173 unsigned opt;
174
175 opt_complementary = "b--bcf:c--bcf:f--bcf";
176 opt = getopt32(argv, optstring, &sopt, &sopt, &sopt, <ok);
177
178 argv += optind;
179 if (!(opt & (CUT_OPT_BYTE_FLGS | CUT_OPT_CHAR_FLGS | CUT_OPT_FIELDS_FLGS)))
180 bb_error_msg_and_die("expected a list of bytes, characters, or fields");
181
182 if (opt & CUT_OPT_DELIM_FLGS) {
183 if (ltok[0] && ltok[1]) {
184 bb_error_msg_and_die("the delimiter must be a single character");
185 }
186 delim = ltok[0];
187 }
188
189
190 if (!(opt & CUT_OPT_FIELDS_FLGS)) {
191 static const char _op_on_field[] ALIGN1 = " only when operating on fields";
192
193 if (opt & CUT_OPT_SUPPRESS_FLGS) {
194 bb_error_msg_and_die
195 ("suppressing non-delimited lines makes sense%s",
196 _op_on_field);
197 }
198 if (delim != '\t') {
199 bb_error_msg_and_die
200 ("a delimiter may be specified%s", _op_on_field);
201 }
202 }
203
204
205
206
207
208
209 {
210 char *ntok;
211 int s = 0, e = 0;
212
213
214 while ((ltok = strsep(&sopt, ",")) != NULL) {
215
216
217 if (!ltok[0])
218 continue;
219
220
221 ntok = strsep(<ok, "-");
222 if (!ntok[0]) {
223 s = BOL;
224 } else {
225 s = xatoi_u(ntok);
226
227
228 if (s != 0)
229 s--;
230 }
231
232
233 if (ltok == NULL) {
234 e = NON_RANGE;
235 } else if (!ltok[0]) {
236 e = EOL;
237 } else {
238 e = xatoi_u(ltok);
239
240
241 if (e == 0)
242 e = EOL;
243 e--;
244 if (e == s)
245 e = NON_RANGE;
246 }
247
248
249 cut_lists = xrealloc_vector(cut_lists, 4, nlists);
250
251
252 cut_lists[nlists].startpos = s;
253 cut_lists[nlists].endpos = e;
254 nlists++;
255 }
256
257
258 if (nlists == 0)
259 bb_error_msg_and_die("missing list of positions");
260
261
262
263
264 qsort(cut_lists, nlists, sizeof(struct cut_list), cmpfunc);
265 }
266
267 {
268 int retval = EXIT_SUCCESS;
269
270 if (!*argv)
271 *--argv = (char *)"-";
272
273 do {
274 FILE *file = fopen_or_warn_stdin(*argv);
275 if (!file) {
276 retval = EXIT_FAILURE;
277 continue;
278 }
279 cut_file(file, delim, cut_lists, nlists);
280 fclose_if_not_stdin(file);
281 } while (*++argv);
282
283 if (ENABLE_FEATURE_CLEAN_UP)
284 free(cut_lists);
285 fflush_stdout_and_exit(retval);
286 }
287}
288