blob: 6d0a68fc16db64f20a0833af7e461c8382f8ab69 [file] [log] [blame]
Denys Vlasenko2cdcb102014-03-05 18:56:20 +01001/* vi: set sw=4 ts=4: */
2/*
3 * shuf: Write a random permutation of the input lines to standard output.
4 *
5 * Copyright (C) 2014 by Bartosz Golaszewski <bartekgola@gmail.com>
6 *
7 * Licensed under GPLv2 or later, see file LICENSE in this source tree.
8 */
9
10//config:config SHUF
11//config: bool "shuf"
12//config: default y
13//config: help
14//config: Generate random permutations
15
16//kbuild:lib-$(CONFIG_SHUF) += shuf.o
17//applet:IF_SHUF(APPLET_NOEXEC(shuf, shuf, BB_DIR_USR_BIN, BB_SUID_DROP, shuf))
18
19//usage:#define shuf_trivial_usage
Bartosz Golaszewski190693c2014-03-07 14:07:35 +010020//usage: "[-e|-i L-H] [-n NUM] [-o FILE] [-z] [FILE|ARG...]"
Denys Vlasenko2cdcb102014-03-05 18:56:20 +010021//usage:#define shuf_full_usage "\n\n"
Denys Vlasenko69f95672014-03-07 14:41:53 +010022//usage: "Randomly permute lines\n"
23//usage: "\n -e Treat ARGs as lines"
24//usage: "\n -i L-H Treat numbers L-H as lines"
Denys Vlasenko2cdcb102014-03-05 18:56:20 +010025//usage: "\n -n NUM Output at most NUM lines"
Denys Vlasenko69f95672014-03-07 14:41:53 +010026//usage: "\n -o FILE Write to FILE, not standard output"
Denys Vlasenko2cdcb102014-03-05 18:56:20 +010027//usage: "\n -z End lines with zero byte, not newline"
28
29#include "libbb.h"
30
31/* This is a NOEXEC applet. Be very careful! */
32
33#define OPT_e (1 << 0)
34#define OPT_i (1 << 1)
35#define OPT_n (1 << 2)
36#define OPT_o (1 << 3)
37#define OPT_z (1 << 4)
38#define OPT_STR "ei:n:o:z"
39
40/*
41 * Use the Fisher-Yates shuffle algorithm on an array of lines.
42 */
43static void shuffle_lines(char **lines, unsigned numlines)
44{
45 unsigned i;
46 unsigned r;
47 char *tmp;
48
49 srand(monotonic_us());
50
51 for (i = numlines-1; i > 0; i--) {
52 r = rand();
53 /* RAND_MAX can be as small as 32767 */
54 if (i > RAND_MAX)
55 r ^= rand() << 15;
56 r %= i;
57 tmp = lines[i];
58 lines[i] = lines[r];
59 lines[r] = tmp;
60 }
61}
62
63int shuf_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE;
64int shuf_main(int argc, char **argv)
65{
66 unsigned opts;
67 char *opt_i_str, *opt_n_str, *opt_o_str;
68 unsigned i;
69 char **lines;
70 unsigned numlines;
71 char eol;
72
73 opt_complementary = "e--i:i--e"; /* mutually exclusive */
74 opts = getopt32(argv, OPT_STR, &opt_i_str, &opt_n_str, &opt_o_str);
75
76 argc -= optind;
77 argv += optind;
78
79 /* Prepare lines for shuffling - either: */
80 if (opts & OPT_e) {
81 /* make lines from command-line arguments */
Denys Vlasenko2cdcb102014-03-05 18:56:20 +010082 numlines = argc;
83 lines = argv;
84 } else
85 if (opts & OPT_i) {
86 /* create a range of numbers */
87 char *dash;
88 unsigned lo, hi;
89
90 dash = strchr(opt_i_str, '-');
91 if (!dash) {
92 bb_error_msg_and_die("bad range '%s'", opt_i_str);
93 }
94 *dash = '\0';
95 lo = xatou(opt_i_str);
96 hi = xatou(dash + 1);
97 *dash = '-';
98 if (hi < lo) {
99 bb_error_msg_and_die("bad range '%s'", opt_i_str);
100 }
101
102 numlines = (hi+1) - lo;
103 lines = xmalloc(numlines * sizeof(lines[0]));
104 for (i = 0; i < numlines; i++) {
Denys Vlasenko102f0d02014-03-07 14:32:39 +0100105 lines[i] = (char*)(uintptr_t)lo;
Denys Vlasenko2cdcb102014-03-05 18:56:20 +0100106 lo++;
107 }
108 } else {
109 /* default - read lines from stdin or the input file */
110 FILE *fp;
111
112 if (argc > 1)
113 bb_show_usage();
114
115 fp = xfopen_stdin(argv[0] ? argv[0] : "-");
116 lines = NULL;
117 numlines = 0;
118 for (;;) {
119 char *line = xmalloc_fgetline(fp);
120 if (!line)
121 break;
122 lines = xrealloc_vector(lines, 6, numlines);
123 lines[numlines++] = line;
124 }
125 fclose_if_not_stdin(fp);
126 }
127
Bartosz Golaszewski58adbb52014-03-07 11:46:03 +0100128 if (numlines != 0)
129 shuffle_lines(lines, numlines);
Denys Vlasenko2cdcb102014-03-05 18:56:20 +0100130
131 if (opts & OPT_o)
132 xmove_fd(xopen(opt_o_str, O_WRONLY|O_CREAT|O_TRUNC), STDOUT_FILENO);
133
134 if (opts & OPT_n) {
135 unsigned maxlines;
136 maxlines = xatou(opt_n_str);
137 if (numlines > maxlines)
138 numlines = maxlines;
139 }
140
141 eol = '\n';
142 if (opts & OPT_z)
143 eol = '\0';
144
145 for (i = 0; i < numlines; i++) {
Denys Vlasenko102f0d02014-03-07 14:32:39 +0100146 if (opts & OPT_i)
147 printf("%u%c", (unsigned)(uintptr_t)lines[i], eol);
148 else
149 printf("%s%c", lines[i], eol);
Denys Vlasenko2cdcb102014-03-05 18:56:20 +0100150 }
151
152 fflush_stdout_and_exit(EXIT_SUCCESS);
153}