Bernhard Reutner-Fischer | 10f8f5f | 2007-03-25 21:50:18 +0000 | [diff] [blame] | 1 | /* vi: set sw=4 ts=4: */ |
| 2 | /* |
| 3 | * split - split a file into pieces |
| 4 | * Copyright (c) 2007 Bernhard Fischer |
| 5 | * |
| 6 | * Licensed under GPLv2 or later, see file LICENSE in this tarball for details. |
| 7 | */ |
Bernhard Reutner-Fischer | b813eaf | 2007-03-26 14:28:12 +0000 | [diff] [blame] | 8 | /* BB_AUDIT: SUSv3 compliant |
Bernhard Reutner-Fischer | 10f8f5f | 2007-03-25 21:50:18 +0000 | [diff] [blame] | 9 | * SUSv3 requirements: |
| 10 | * http://www.opengroup.org/onlinepubs/009695399/utilities/split.html |
| 11 | */ |
| 12 | #include "busybox.h" |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 13 | |
Bernhard Reutner-Fischer | cd43dfd | 2007-03-26 10:46:31 +0000 | [diff] [blame] | 14 | static const struct suffix_mult split_suffices[] = { |
Bernhard Reutner-Fischer | 0a537a0 | 2007-03-28 16:48:40 +0000 | [diff] [blame^] | 15 | #if ENABLE_FEATURE_SPLIT_FANCY |
Bernhard Reutner-Fischer | cd43dfd | 2007-03-26 10:46:31 +0000 | [diff] [blame] | 16 | { "b", 512 }, |
Bernhard Reutner-Fischer | 0a537a0 | 2007-03-28 16:48:40 +0000 | [diff] [blame^] | 17 | #endif |
Bernhard Reutner-Fischer | cd43dfd | 2007-03-26 10:46:31 +0000 | [diff] [blame] | 18 | { "k", 1024 }, |
| 19 | { "m", 1024*1024 }, |
Bernhard Reutner-Fischer | 0a537a0 | 2007-03-28 16:48:40 +0000 | [diff] [blame^] | 20 | #if ENABLE_FEATURE_SPLIT_FANCY |
Bernhard Reutner-Fischer | cd43dfd | 2007-03-26 10:46:31 +0000 | [diff] [blame] | 21 | { "g", 1024*1024*1024 }, |
Bernhard Reutner-Fischer | 0a537a0 | 2007-03-28 16:48:40 +0000 | [diff] [blame^] | 22 | #endif |
Bernhard Reutner-Fischer | cd43dfd | 2007-03-26 10:46:31 +0000 | [diff] [blame] | 23 | { NULL, 0 } |
| 24 | }; |
Bernhard Reutner-Fischer | 10f8f5f | 2007-03-25 21:50:18 +0000 | [diff] [blame] | 25 | |
/* Increment the suffix part of the filename, in place.
 *
 * old        - NUL-terminated output name; its last suffix_len characters
 *              are the suffix and are the only ones ever modified
 * suffix_len - number of trailing characters that make up the suffix
 *
 * The suffix is advanced like a counter whose rightmost character is the
 * least significant digit: the first character from the right that is
 * below 'z' is bumped by one, and every 'z' passed on the way wraps to 'a'.
 *
 * Returns old on success.
 * Returns NULL if we are out of filenames, i.e. every suffix character is
 * already 'z', or there is no suffix to advance (suffix_len is 0 or longer
 * than the name itself).
 */
static char *next_file(char *old, unsigned suffix_len)
{
	size_t end = strlen(old);
	unsigned i;

	/* Stay inside the suffix: without this guard a zero-length suffix
	 * would increment the last character of the prefix (or touch old[-1]
	 * for an empty name), and an oversized suffix_len would walk before
	 * the start of the buffer. */
	if (suffix_len == 0 || suffix_len > end)
		return NULL;

	for (i = 1; ; i++) {
		char *curr = old + end - i;

		if (*curr < 'z') {
			*curr += 1;
			return old;
		}
		/* The most significant suffix character is already 'z':
		 * nothing left to carry into. */
		if (i == suffix_len)
			return NULL;
		/* Wrap this position and carry into the one to its left. */
		*curr = 'a';
	}
}
Bernhard Reutner-Fischer | b813eaf | 2007-03-26 14:28:12 +0000 | [diff] [blame] | 50 | |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 51 | #define read_buffer bb_common_bufsiz1 |
| 52 | enum { READ_BUFFER_SIZE = sizeof(bb_common_bufsiz1) - 1 }; |
| 53 | |
Bernhard Reutner-Fischer | 10f8f5f | 2007-03-25 21:50:18 +0000 | [diff] [blame] | 54 | #define SPLIT_OPT_l (1<<0) |
| 55 | #define SPLIT_OPT_b (1<<1) |
Bernhard Reutner-Fischer | cd43dfd | 2007-03-26 10:46:31 +0000 | [diff] [blame] | 56 | #define SPLIT_OPT_a (1<<2) |
Bernhard Reutner-Fischer | 10f8f5f | 2007-03-25 21:50:18 +0000 | [diff] [blame] | 57 | |
| 58 | int split_main(int argc, char **argv); |
| 59 | int split_main(int argc, char **argv) |
| 60 | { |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 61 | unsigned suffix_len = 2; |
| 62 | char *pfx; |
| 63 | char *count_p; |
| 64 | const char *sfx; |
Bernhard Reutner-Fischer | 0a537a0 | 2007-03-28 16:48:40 +0000 | [diff] [blame^] | 65 | off_t cnt = 1000; |
| 66 | off_t remaining = 0; |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 67 | unsigned opt; |
Bernhard Reutner-Fischer | 0a537a0 | 2007-03-28 16:48:40 +0000 | [diff] [blame^] | 68 | ssize_t bytes_read, to_write; |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 69 | char *src; |
| 70 | |
| 71 | opt_complementary = "?2"; |
Bernhard Reutner-Fischer | 576de34 | 2007-03-26 18:19:29 +0000 | [diff] [blame] | 72 | opt = getopt32(argc, argv, "l:b:a:", &count_p, &count_p, &sfx); |
Bernhard Reutner-Fischer | 10f8f5f | 2007-03-25 21:50:18 +0000 | [diff] [blame] | 73 | |
Bernhard Reutner-Fischer | 576de34 | 2007-03-26 18:19:29 +0000 | [diff] [blame] | 74 | if (opt & SPLIT_OPT_l) |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 75 | cnt = xatoul(count_p); |
Bernhard Reutner-Fischer | 576de34 | 2007-03-26 18:19:29 +0000 | [diff] [blame] | 76 | if (opt & SPLIT_OPT_b) |
Bernhard Reutner-Fischer | b813eaf | 2007-03-26 14:28:12 +0000 | [diff] [blame] | 77 | cnt = xatoul_sfx(count_p, split_suffices); |
Bernhard Reutner-Fischer | 576de34 | 2007-03-26 18:19:29 +0000 | [diff] [blame] | 78 | if (opt & SPLIT_OPT_a) |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 79 | suffix_len = xatou(sfx); |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 80 | sfx = "x"; |
Bernhard Reutner-Fischer | 0a537a0 | 2007-03-28 16:48:40 +0000 | [diff] [blame^] | 81 | |
| 82 | argv += optind; |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 83 | if (argv[0]) { |
| 84 | if (argv[1]) |
| 85 | sfx = argv[1]; |
| 86 | xmove_fd(xopen(argv[0], O_RDONLY), 0); |
| 87 | } else { |
| 88 | argv[0] = (char *) bb_msg_standard_input; |
| 89 | } |
Bernhard Reutner-Fischer | b813eaf | 2007-03-26 14:28:12 +0000 | [diff] [blame] | 90 | |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 91 | if (NAME_MAX < strlen(sfx) + suffix_len) |
| 92 | bb_error_msg_and_die("suffix too long"); |
Bernhard Reutner-Fischer | 10f8f5f | 2007-03-25 21:50:18 +0000 | [diff] [blame] | 93 | |
| 94 | { |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 95 | char *char_p = xzalloc(suffix_len + 1); |
Bernhard Reutner-Fischer | 10f8f5f | 2007-03-25 21:50:18 +0000 | [diff] [blame] | 96 | memset(char_p, 'a', suffix_len); |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 97 | pfx = xasprintf("%s%s", sfx, char_p); |
Bernhard Reutner-Fischer | 10f8f5f | 2007-03-25 21:50:18 +0000 | [diff] [blame] | 98 | if (ENABLE_FEATURE_CLEAN_UP) |
| 99 | free(char_p); |
| 100 | } |
Bernhard Reutner-Fischer | b813eaf | 2007-03-26 14:28:12 +0000 | [diff] [blame] | 101 | |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 102 | while (1) { |
| 103 | bytes_read = safe_read(0, read_buffer, READ_BUFFER_SIZE); |
| 104 | if (!bytes_read) |
| 105 | break; |
| 106 | if (bytes_read < 0) |
| 107 | bb_perror_msg_and_die("%s", argv[0]); |
| 108 | src = read_buffer; |
Bernhard Reutner-Fischer | 10f8f5f | 2007-03-25 21:50:18 +0000 | [diff] [blame] | 109 | do { |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 110 | if (!remaining) { |
| 111 | if (!pfx) |
Bernhard Reutner-Fischer | 0a537a0 | 2007-03-28 16:48:40 +0000 | [diff] [blame^] | 112 | bb_error_msg_and_die("suffixes exhausted"); |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 113 | xmove_fd(xopen(pfx, O_WRONLY | O_CREAT | O_TRUNC), 1); |
| 114 | pfx = next_file(pfx, suffix_len); |
| 115 | remaining = cnt; |
Bernhard Reutner-Fischer | b813eaf | 2007-03-26 14:28:12 +0000 | [diff] [blame] | 116 | } |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 117 | |
| 118 | if (opt & SPLIT_OPT_b) { |
| 119 | /* split by bytes */ |
| 120 | to_write = (bytes_read < remaining) ? bytes_read : remaining; |
| 121 | remaining -= to_write; |
| 122 | } else { |
| 123 | /* split by lines */ |
| 124 | /* can be sped up by using _memrchr_ |
| 125 | * and writing many lines at once... */ |
| 126 | char *end = memchr(src, '\n', bytes_read); |
| 127 | if (end) { |
| 128 | --remaining; |
| 129 | to_write = end - src + 1; |
| 130 | } else { |
| 131 | to_write = bytes_read; |
| 132 | } |
Bernhard Reutner-Fischer | b813eaf | 2007-03-26 14:28:12 +0000 | [diff] [blame] | 133 | } |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 134 | |
| 135 | xwrite(1, src, to_write); |
| 136 | bytes_read -= to_write; |
| 137 | src += to_write; |
| 138 | } while (bytes_read); |
Bernhard Reutner-Fischer | 10f8f5f | 2007-03-25 21:50:18 +0000 | [diff] [blame] | 139 | } |
Denis Vlasenko | 91dd275 | 2007-03-26 20:15:40 +0000 | [diff] [blame] | 140 | return 0; |
Bernhard Reutner-Fischer | 10f8f5f | 2007-03-25 21:50:18 +0000 | [diff] [blame] | 141 | } |