logo

utils-std

Collection of commonly available Unix tools git clone https://anongit.hacktivis.me/git/utils-std.git/

paste.c (6227B)


  1. /*-
  2. * SPDX-License-Identifier: BSD-3-Clause
  3. *
  4. * Copyright (c) 1989, 1993
  5. * The Regents of the University of California. All rights reserved.
  6. *
  7. * This code is derived from software contributed to Berkeley by
  8. * Adam S. Moskowitz of Menlo Consulting.
  9. *
  10. * Redistribution and use in source and binary forms, with or without
  11. * modification, are permitted provided that the following conditions
  12. * are met:
  13. * 1. Redistributions of source code must retain the above copyright
  14. * notice, this list of conditions and the following disclaimer.
  15. * 2. Redistributions in binary form must reproduce the above copyright
  16. * notice, this list of conditions and the following disclaimer in the
  17. * documentation and/or other materials provided with the distribution.
  18. * 3. Neither the name of the University nor the names of its contributors
  19. * may be used to endorse or promote products derived from this software
  20. * without specific prior written permission.
  21. *
  22. * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
  23. * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  24. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  25. * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
  26. * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  27. * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  28. * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  29. * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  30. * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  31. * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  32. * SUCH DAMAGE.
  33. */
  34. #define _POSIX_C_SOURCE 200809L
  35. #include "../lib/err.h"
  36. #include "../lib/getopt_nolong.h"
  37. #include <errno.h>
  38. #include <limits.h>
  39. #include <locale.h>
  40. #include <stdint.h> // SIZE_MAX
  41. #include <stdio.h>
  42. #include <stdlib.h>
  43. #include <string.h>
  44. #include <sys/types.h>
  45. #include <unistd.h>
  46. #include <wchar.h>
  47. static wchar_t *delim;
  48. static int delimcnt;
  49. static wint_t linedelim = L'\n';
  50. static wchar_t tab[] = L"\t";
  51. const char *argv0 = "paste";
  52. typedef struct _list
  53. {
  54. struct _list *next;
  55. FILE *fp;
  56. int cnt;
  57. char *name;
  58. } LIST;
  59. static int
  60. parallel(char **argv)
  61. {
  62. LIST *lp;
  63. int cnt;
  64. wint_t ich;
  65. wchar_t ch;
  66. char *p;
  67. LIST *head, *tmp;
  68. int opencnt, output;
  69. for(cnt = 0, head = tmp = NULL; (p = *argv); ++argv, ++cnt)
  70. {
  71. if((lp = malloc(sizeof(LIST))) == NULL) utils_err(1, NULL);
  72. if(p[0] == '-' && !p[1])
  73. lp->fp = stdin;
  74. else if(!(lp->fp = fopen(p, "r")))
  75. utils_err(1, "%s", p);
  76. lp->next = NULL;
  77. lp->cnt = cnt;
  78. lp->name = p;
  79. if(!head)
  80. head = tmp = lp;
  81. else
  82. {
  83. tmp->next = lp;
  84. tmp = lp;
  85. }
  86. }
  87. for(opencnt = cnt; opencnt;)
  88. {
  89. for(output = 0, lp = head; lp; lp = lp->next)
  90. {
  91. if(!lp->fp)
  92. {
  93. if(output && lp->cnt && (ch = delim[(lp->cnt - 1) % delimcnt])) putwchar(ch);
  94. continue;
  95. }
  96. if((ich = getwc(lp->fp)) == WEOF)
  97. {
  98. if(!--opencnt) break;
  99. lp->fp = NULL;
  100. if(output && lp->cnt && (ch = delim[(lp->cnt - 1) % delimcnt])) putwchar(ch);
  101. continue;
  102. }
  103. /*
  104. * make sure that we don't print any delimiters
  105. * unless there's a non-empty file.
  106. */
  107. if(!output)
  108. {
  109. output = 1;
  110. for(cnt = 0; cnt < lp->cnt; ++cnt)
  111. if((ch = delim[cnt % delimcnt])) putwchar(ch);
  112. }
  113. else if((ch = delim[(lp->cnt - 1) % delimcnt]))
  114. putwchar(ch);
  115. if(ich == linedelim) continue;
  116. do
  117. {
  118. putwchar(ich);
  119. } while((ich = getwc(lp->fp)) != WEOF && ich != linedelim);
  120. }
  121. if(output) putwchar(linedelim);
  122. }
  123. return (0);
  124. }
  125. static int
  126. sequential(char **argv)
  127. {
  128. FILE *fp;
  129. int cnt, failed, needdelim;
  130. wint_t ch;
  131. char *p;
  132. failed = 0;
  133. for(; (p = *argv); ++argv)
  134. {
  135. if(p[0] == '-' && !p[1])
  136. fp = stdin;
  137. else if(!(fp = fopen(p, "r")))
  138. {
  139. utils_warn("%s", p);
  140. failed = 1;
  141. continue;
  142. }
  143. cnt = needdelim = 0;
  144. while((ch = getwc(fp)) != WEOF)
  145. {
  146. if(needdelim)
  147. {
  148. needdelim = 0;
  149. if(delim[cnt] != '\0') putwchar(delim[cnt]);
  150. if(++cnt == delimcnt) cnt = 0;
  151. }
  152. if(ch != linedelim)
  153. putwchar(ch);
  154. else
  155. needdelim = 1;
  156. }
  157. if(needdelim) putwchar(linedelim);
  158. if(fp != stdin) (void)fclose(fp);
  159. }
  160. return (failed != 0);
  161. }
  162. static int
  163. tr(wchar_t *arg)
  164. {
  165. int cnt;
  166. wchar_t ch, *p;
  167. for(p = arg, cnt = 0; (ch = *p++); ++arg, ++cnt)
  168. if(ch == '\\') switch(ch = *p++)
  169. {
  170. case 'n':
  171. *arg = '\n';
  172. break;
  173. case 't':
  174. *arg = '\t';
  175. break;
  176. case '0':
  177. *arg = '\0';
  178. break;
  179. default:
  180. *arg = ch;
  181. break;
  182. }
  183. else
  184. *arg = ch;
  185. if(!cnt) utils_errx(1, "no delimiters specified");
  186. return (cnt);
  187. }
  188. static void
  189. usage(void)
  190. {
  191. (void)fprintf(stderr, "usage: paste [-sz] [-d delimiters] [file...]\n");
  192. exit(1);
  193. }
  194. int
  195. main(int argc, char *argv[])
  196. {
  197. char *lc_all = setlocale(LC_ALL, "");
  198. if(lc_all == NULL)
  199. {
  200. fprintf(stderr,
  201. "%s: warning: Failed loading locales. setlocale(LC_ALL, \"\"): %s\n",
  202. argv0,
  203. strerror(errno));
  204. }
  205. errno = 0;
  206. int seq = 0;
  207. for(int c = -1; (c = getopt_nolong(argc, argv, ":d:sz")) != -1;)
  208. {
  209. switch(c)
  210. {
  211. case 'd':
  212. {
  213. const char *arg = optarg;
  214. size_t len = mbsrtowcs(NULL, &arg, 0, NULL);
  215. if(len == (size_t)-1) utils_err(1, "delimiters");
  216. if(len == SIZE_MAX) utils_err(1, NULL);
  217. wchar_t *warg = calloc((len + 1), sizeof(*warg));
  218. if(warg == NULL) utils_err(1, NULL);
  219. arg = optarg;
  220. len = mbsrtowcs(warg, &arg, len + 1, NULL);
  221. if(len == (size_t)-1) utils_err(1, "delimiters");
  222. delimcnt = tr(delim = warg);
  223. break;
  224. }
  225. case 's':
  226. seq = 1;
  227. break;
  228. case 'z':
  229. linedelim = L'\0';
  230. break;
  231. case ':':
  232. fprintf(stderr, "%s: error: Missing operand for option: '-%c'\n", argv0, optopt);
  233. usage();
  234. return 1;
  235. case '?':
  236. if(!got_long_opt) fprintf(stderr, "%s: error: Unrecognised option: '-%c'\n", argv0, optopt);
  237. usage();
  238. return 1;
  239. default:
  240. abort();
  241. }
  242. }
  243. argc -= optind;
  244. argv += optind;
  245. char *dash[] = {(char *)"-", NULL};
  246. char **args = argc > 0 ? argv : dash;
  247. if(!delim)
  248. {
  249. delimcnt = 1;
  250. delim = tab;
  251. }
  252. if(seq)
  253. return sequential(args);
  254. else
  255. return parallel(args);
  256. }