1 /* comm -- compare two sorted files line by line.
2 Copyright (C) 86, 90, 91, 1995-2005 Free Software Foundation, Inc.
4 This program is free software: you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation, either version 3 of the License, or
7 (at your option) any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program. If not, see <http://www.gnu.org/licenses/>. */
17 /* Written by Richard Stallman and David MacKenzie. */
22 #include <sys/types.h>
24 #include "linebuffer.h"
26 #include "hard-locale.h"
31 /* The official name of this program (e.g., no `g' prefix). */
32 #define PROGRAM_NAME "comm"
/* Author names.  This expands to two separate string literals joined by a
   comma, so it is only meaningful inside an argument list; main passes it
   to case_GETOPT_VERSION_CHAR right after PROGRAM_NAME. */
34 #define AUTHORS "Richard Stallman", "David MacKenzie"
36 /* Undefine, to avoid warning about redefinition on some systems. */
/* Yield the smaller of X and Y.  Each argument appears twice in the
   expansion, so an argument with side effects could be evaluated twice;
   the use in compare_files passes plain length fields only. */
38 #define min(x, y) ((x) < (y) ? (x) : (y))
40 /* The name this program was run with. */
43 /* True if the LC_COLLATE locale is hard.  Assigned in main from
   hard_locale (LC_COLLATE), after the setlocale call. */
44 static bool hard_LC_COLLATE
;
46 /* If true, print lines that are found only in file 1.
   NOTE(review): no assignment to this flag is visible in this excerpt;
   per the usage text, option -1 suppresses this column -- confirm where
   the flag is set. */
47 static bool only_file_1
;
49 /* If true, print lines that are found only in file 2.
   NOTE(review): no assignment to this flag is visible in this excerpt;
   per the usage text, option -2 suppresses this column -- confirm where
   the flag is set. */
50 static bool only_file_2
;
52 /* If true, print lines that are found in both files. */
/* Long-option table handed to getopt_long in main.  The two entries
   visible here come from the shared help and version option declaration
   macros; the short options 1, 2 and 3 are supplied separately through
   the optstring argument. */
55 static struct option
const long_options
[] =
57 {GETOPT_HELP_OPTION_DECL
},
58 {GETOPT_VERSION_OPTION_DECL
},
/* When STATUS is not EXIT_SUCCESS, a one-line pointer to --help is
   written to stderr. */
67 if (status
!= EXIT_SUCCESS
)
68 fprintf (stderr
, _("Try `%s --help' for more information.\n"),
73 Usage: %s [OPTION]... FILE1 FILE2\n\
77 Compare sorted files FILE1 and FILE2 line by line.\n\
81 With no options, produce three-column output. Column one contains\n\
82 lines unique to FILE1, column two contains lines unique to FILE2,\n\
83 and column three contains lines common to both files.\n\
87 -1 suppress lines unique to FILE1\n\
88 -2 suppress lines unique to FILE2\n\
89 -3 suppress lines that appear in both files\n\
91 fputs (HELP_OPTION_DESCRIPTION
, stdout
);
/* Both shared option descriptions are written to stdout with fputs, so
   they are emitted as-is with no format processing;
   emit_bug_reporting_address is called last. */
92 fputs (VERSION_OPTION_DESCRIPTION
, stdout
);
93 emit_bug_reporting_address ();
98 /* Output the line in linebuffer LINE to stream STREAM
99 provided the switches say it should be output.
100 CLASS is 1 for a line found only in file 1,
101 2 for a line only in file 2, 3 for a line in both. */
/* LINE is only read (it is const-qualified).  Every call visible in
   compare_files passes stdout as STREAM and a literal 1, 2 or 3 as
   CLASS. */
104 writeline (const struct linebuffer
*line
, FILE *stream
, int class)
/* NOTE(review): the statements that the three TAB comments below annotate
   are not visible in this excerpt.  Presumably a line is indented by one
   TAB for each lower-numbered column that is being printed -- confirm
   against the full source. */
116 /* Print a TAB if we are printing lines from file 1. */
124 /* Print a TAB if we are printing lines from file 1. */
127 /* Print a TAB if we are printing lines from file 2. */
/* Write exactly LINE->length bytes of LINE->buffer, so the text does not
   need to be NUL-terminated.  The fwrite result is not checked here.
   NOTE(review): main registers close_stdout with atexit, which presumably
   reports a pending write error at exit -- confirm. */
133 fwrite (line
->buffer
, sizeof (char), line
->length
, stream
);
136 /* Compare INFILES[0] and INFILES[1].
137 If either is "-", use the standard input for that file.
138 Assume that each input file is sorted;
139 merge them and output the result. */
/* INFILES must provide at least two file-name strings; only elements 0
   and 1 are read.  Open, read and close failures are all reported through
   error with EXIT_FAILURE as the status argument, errno as the error
   number and the file name as the message. */
142 compare_files (char **infiles
)
144 /* For each file, we have one linebuffer in lb1. */
145 struct linebuffer lb1
[2];
147 /* thisline[i] points to the linebuffer holding the next available line
148 in file i, or is NULL if there are no lines left in that file. */
149 struct linebuffer
*thisline
[2];
151 /* streams[i] holds the input stream for file i. */
156 /* Initialize the storage. */
/* For each input: prepare its buffer, select the stream (stdin itself when
   the name is "-", otherwise fopen in read mode), then read the first line
   so that thisline[i] is primed before the merge loop starts. */
157 for (i
= 0; i
< 2; i
++)
159 initbuffer (&lb1
[i
]);
160 thisline
[i
] = &lb1
[i
];
161 streams
[i
] = (STREQ (infiles
[i
], "-") ? stdin
: fopen (infiles
[i
], "r"));
/* NOTE(review): the condition guarding this call is not visible in this
   excerpt; presumably it tests for a failed open. */
163 error (EXIT_FAILURE
, errno
, "%s", infiles
[i
]);
165 thisline
[i
] = readlinebuffer (thisline
[i
], streams
[i
]);
/* The stream error flag is tested after the read; per the comment on
   thisline, running out of lines is signalled separately by a NULL
   thisline[i]. */
166 if (ferror (streams
[i
]))
167 error (EXIT_FAILURE
, errno
, "%s", infiles
[i
]);
/* Keep merging until both inputs have run out of lines. */
170 while (thisline
[0] || thisline
[1])
174 /* Compare the next available lines of the two files. */
/* NOTE(review): the first branch of this chain and the branch bodies are
   not visible in this excerpt; this arm is taken when the second input
   has no line left. */
178 else if (!thisline
[1])
/* Comparison through xmemcoll.  Each length is passed minus one --
   presumably to leave out a trailing newline stored by readlinebuffer;
   confirm against linebuffer.h. */
183 order
= xmemcoll (thisline
[0]->buffer
, thisline
[0]->length
- 1,
184 thisline
[1]->buffer
, thisline
[1]->length
- 1);
/* Byte-wise comparison with memcmp over the first LEN bytes only, where
   LEN is the shorter of the two lengths minus one. */
187 size_t len
= min (thisline
[0]->length
, thisline
[1]->length
) - 1;
188 order
= memcmp (thisline
[0]->buffer
, thisline
[1]->buffer
, len
);
/* Ordering by length.  In the arms visible here, equal lengths give 0 and
   a longer first line gives 1 (the value of the != test); the arm taken
   when the first line is shorter is on a line not visible in this
   excerpt, as is the condition under which this assignment runs. */
190 order
= (thisline
[0]->length
< thisline
[1]->length
192 : thisline
[0]->length
!= thisline
[1]->length
);
196 /* Output the line that is lesser. */
/* The last argument is the column class described at writeline.  Note
   that a line common to both inputs is printed from the second file
   buffer, thisline[1].  The tests on ORDER that select among these calls
   are not visible in this excerpt. */
198 writeline (thisline
[1], stdout
, 3);
200 writeline (thisline
[1], stdout
, 2);
202 writeline (thisline
[0], stdout
, 1);
204 /* Step the file the line came from.
205 If the files match, step both files. */
/* Each step reuses the same linebuffer for the next line and checks the
   stream error flag again. */
208 thisline
[1] = readlinebuffer (thisline
[1], streams
[1]);
209 if (ferror (streams
[1]))
210 error (EXIT_FAILURE
, errno
, "%s", infiles
[1]);
214 thisline
[0] = readlinebuffer (thisline
[0], streams
[0]);
215 if (ferror (streams
[0]))
216 error (EXIT_FAILURE
, errno
, "%s", infiles
[0]);
/* Close both inputs; a failing fclose is reported through error.
   NOTE(review): streams[i] can be stdin itself, and when both operands
   are "-" the same stream would be closed twice here -- confirm whether
   that case is rejected before this point. */
220 for (i
= 0; i
< 2; i
++)
221 if (fclose (streams
[i
]) != 0)
222 error (EXIT_FAILURE
, errno
, "%s", infiles
[i
]);
/* Program entry point: set up the locale and message catalog, parse the
   options, require exactly two file operands, then hand them to
   compare_files. */
226 main (int argc
, char **argv
)
230 initialize_main (&argc
, &argv
);
231 program_name
= argv
[0];
/* Select the locale with an empty locale name, bind the message catalog
   for PACKAGE, and cache the result of hard_locale (LC_COLLATE) in
   hard_LC_COLLATE. */
232 setlocale (LC_ALL
, "");
233 bindtextdomain (PACKAGE
, LOCALEDIR
);
234 textdomain (PACKAGE
);
235 hard_LC_COLLATE
= hard_locale (LC_COLLATE
);
/* Register close_stdout to run at normal program exit. */
237 atexit (close_stdout
);
/* The short options are the digits 1, 2 and 3; none takes an argument
   (there is no colon in the optstring).  Long options come from
   long_options. */
243 while ((c
= getopt_long (argc
, argv
, "123", long_options
, NULL
)) != -1)
258 case_GETOPT_HELP_CHAR
;
260 case_GETOPT_VERSION_CHAR (PROGRAM_NAME
, AUTHORS
);
/* NOTE(review): the case labels are not visible in this excerpt;
   presumably this call is the fallback for an unrecognized option. */
263 usage (EXIT_FAILURE
);
/* Fewer than two operands remain after option parsing.  One of the two
   diagnostics below is issued (the test choosing between them is not
   visible here); error is called with a zero status argument, and
   usage (EXIT_FAILURE) follows. */
266 if (argc
- optind
< 2)
269 error (0, 0, _("missing operand"));
271 error (0, 0, _("missing operand after %s"), quote (argv
[argc
- 1]));
272 usage (EXIT_FAILURE
);
/* More than two operands: name the first surplus one, argv[optind + 2]. */
275 if (2 < argc
- optind
)
277 error (0, 0, _("extra operand %s"), quote (argv
[optind
+ 2]));
278 usage (EXIT_FAILURE
);
/* argv + optind points at the first operand, which compare_files reads as
   INFILES[0]. */
281 compare_files (argv
+ optind
);