1 ///////////////////////////////////////////////////////////////////////////////
2 //
3 /// \file       message.c
4 /// \brief      Printing messages
5 //
6 //  Author:     Lasse Collin
7 //
8 //  This file has been put into the public domain.
9 //  You can do whatever you want with this file.
10 //
11 ///////////////////////////////////////////////////////////////////////////////
12 
13 #include "private.h"
14 
15 #include <stdarg.h>
16 
17 
18 /// Number of the current file
19 static unsigned int files_pos = 0;
20 
21 /// Total number of input files; zero if unknown.
22 static unsigned int files_total;
23 
24 /// Verbosity level
25 static enum message_verbosity verbosity = V_WARNING;
26 
27 /// Filename which we will print with the verbose messages
28 static const char *filename;
29 
30 /// True once the a filename has been printed to stderr as part of progress
31 /// message. If automatic progress updating isn't enabled, this becomes true
32 /// after the first progress message has been printed due to user sending
33 /// SIGINFO, SIGUSR1, or SIGALRM. Once this variable is true, we will print
34 /// an empty line before the next filename to make the output more readable.
35 static bool first_filename_printed = false;
36 
37 /// This is set to true when we have printed the current filename to stderr
38 /// as part of a progress message. This variable is useful only if not
39 /// updating progress automatically: if user sends many SIGINFO, SIGUSR1, or
40 /// SIGALRM signals, we won't print the name of the same file multiple times.
41 static bool current_filename_printed = false;
42 
43 /// True if we should print progress indicator and update it automatically
44 /// if also verbose >= V_VERBOSE.
45 static bool progress_automatic;
46 
47 /// True if message_progress_start() has been called but
48 /// message_progress_end() hasn't been called yet.
49 static bool progress_started = false;
50 
51 /// This is true when a progress message was printed and the cursor is still
52 /// on the same line with the progress message. In that case, a newline has
53 /// to be printed before any error messages.
54 static bool progress_active = false;
55 
56 /// Pointer to lzma_stream used to do the encoding or decoding.
57 static lzma_stream *progress_strm;
58 
59 /// Expected size of the input stream is needed to show completion percentage
60 /// and estimate remaining time.
61 static uint64_t expected_in_size;
62 
63 
64 // Use alarm() and SIGALRM when they are supported. This has two minor
65 // advantages over the alternative of polling gettimeofday():
66 //  - It is possible for the user to send SIGINFO, SIGUSR1, or SIGALRM to
67 //    get intermediate progress information even when --verbose wasn't used
68 //    or stderr is not a terminal.
69 //  - alarm() + SIGALRM seems to have slightly less overhead than polling
70 //    gettimeofday().
71 #ifdef SIGALRM
72 
73 const int message_progress_sigs[] = {
74           SIGALRM,
75 #ifdef SIGINFO
76           SIGINFO,
77 #endif
78 #ifdef SIGUSR1
79           SIGUSR1,
80 #endif
81           0
82 };
83 
84 /// The signal handler for SIGALRM sets this to true. It is set back to false
85 /// once the progress message has been updated.
86 static volatile sig_atomic_t progress_needs_updating = false;
87 
88 /// Signal handler for SIGALRM
89 static void
progress_signal_handler(int sig lzma_attribute ((__unused__)))90 progress_signal_handler(int sig lzma_attribute((__unused__)))
91 {
92           progress_needs_updating = true;
93           return;
94 }
95 
96 #else
97 
98 /// This is true when progress message printing is wanted. Using the same
99 /// variable name as above to avoid some ifdefs.
100 static bool progress_needs_updating = false;
101 
102 /// Elapsed time when the next progress message update should be done.
103 static uint64_t progress_next_update;
104 
105 #endif
106 
107 
108 extern void
message_init(void)109 message_init(void)
110 {
111           // If --verbose is used, we use a progress indicator if and only
112           // if stderr is a terminal. If stderr is not a terminal, we print
113           // verbose information only after finishing the file. As a special
114           // exception, even if --verbose was not used, user can send SIGALRM
115           // to make us print progress information once without automatic
116           // updating.
117           progress_automatic = isatty(STDERR_FILENO);
118 
119           // Commented out because COLUMNS is rarely exported to environment.
120           // Most users have at least 80 columns anyway, let's think something
121           // fancy here if enough people complain.
122 /*
123           if (progress_automatic) {
124                     // stderr is a terminal. Check the COLUMNS environment
125                     // variable to see if the terminal is wide enough. If COLUMNS
126                     // doesn't exist or it has some unparsable value, we assume
127                     // that the terminal is wide enough.
128                     const char *columns_str = getenv("COLUMNS");
129                     if (columns_str != NULL) {
130                               char *endptr;
131                               const long columns = strtol(columns_str, &endptr, 10);
132                               if (*endptr != '\0' || columns < 80)
133                                         progress_automatic = false;
134                     }
135           }
136 */
137 
138 #ifdef SIGALRM
139           // Establish the signal handlers which set a flag to tell us that
140           // progress info should be updated.
141           struct sigaction sa;
142           sigemptyset(&sa.sa_mask);
143           sa.sa_flags = 0;
144           sa.sa_handler = &progress_signal_handler;
145 
146           for (size_t i = 0; message_progress_sigs[i] != 0; ++i)
147                     if (sigaction(message_progress_sigs[i], &sa, NULL))
148                               message_signal_handler();
149 #endif
150 
151           return;
152 }
153 
154 
155 extern void
message_verbosity_increase(void)156 message_verbosity_increase(void)
157 {
158           if (verbosity < V_DEBUG)
159                     ++verbosity;
160 
161           return;
162 }
163 
164 
165 extern void
message_verbosity_decrease(void)166 message_verbosity_decrease(void)
167 {
168           if (verbosity > V_SILENT)
169                     --verbosity;
170 
171           return;
172 }
173 
174 
175 extern enum message_verbosity
message_verbosity_get(void)176 message_verbosity_get(void)
177 {
178           return verbosity;
179 }
180 
181 
182 extern void
message_set_files(unsigned int files)183 message_set_files(unsigned int files)
184 {
185           files_total = files;
186           return;
187 }
188 
189 
190 /// Prints the name of the current file if it hasn't been printed already,
191 /// except if we are processing exactly one stream from stdin to stdout.
192 /// I think it looks nicer to not print "(stdin)" when --verbose is used
193 /// in a pipe and no other files are processed.
194 static void
print_filename(void)195 print_filename(void)
196 {
197           if (!opt_robot && (files_total != 1 || filename != stdin_filename)) {
198                     signals_block();
199 
200                     FILE *file = opt_mode == MODE_LIST ? stdout : stderr;
201 
202                     // If a file was already processed, put an empty line
203                     // before the next filename to improve readability.
204                     if (first_filename_printed)
205                               fputc('\n', file);
206 
207                     first_filename_printed = true;
208                     current_filename_printed = true;
209 
210                     // If we don't know how many files there will be due
211                     // to usage of --files or --files0.
212                     if (files_total == 0)
213                               fprintf(file, "%s (%u)\n", filename,
214                                                   files_pos);
215                     else
216                               fprintf(file, "%s (%u/%u)\n", filename,
217                                                   files_pos, files_total);
218 
219                     signals_unblock();
220           }
221 
222           return;
223 }
224 
225 
226 extern void
message_filename(const char * src_name)227 message_filename(const char *src_name)
228 {
229           // Start numbering the files starting from one.
230           ++files_pos;
231           filename = src_name;
232 
233           if (verbosity >= V_VERBOSE
234                               && (progress_automatic || opt_mode == MODE_LIST))
235                     print_filename();
236           else
237                     current_filename_printed = false;
238 
239           return;
240 }
241 
242 
243 extern void
message_progress_start(lzma_stream * strm,uint64_t in_size)244 message_progress_start(lzma_stream *strm, uint64_t in_size)
245 {
246           // Store the pointer to the lzma_stream used to do the coding.
247           // It is needed to find out the position in the stream.
248           progress_strm = strm;
249 
250           // Store the expected size of the file. If we aren't printing any
251           // statistics, then is will be unused. But since it is possible
252           // that the user sends us a signal to show statistics, we need
253           // to have it available anyway.
254           expected_in_size = in_size;
255 
256           // Indicate that progress info may need to be printed before
257           // printing error messages.
258           progress_started = true;
259 
260           // If progress indicator is wanted, print the filename and possibly
261           // the file count now.
262           if (verbosity >= V_VERBOSE && progress_automatic) {
263                     // Start the timer to display the first progress message
264                     // after one second. An alternative would be to show the
265                     // first message almost immediately, but delaying by one
266                     // second looks better to me, since extremely early
267                     // progress info is pretty much useless.
268 #ifdef SIGALRM
269                     // First disable a possibly existing alarm.
270                     alarm(0);
271                     progress_needs_updating = false;
272                     alarm(1);
273 #else
274                     progress_needs_updating = true;
275                     progress_next_update = 1000;
276 #endif
277           }
278 
279           return;
280 }
281 
282 
283 /// Make the string indicating completion percentage.
284 static const char *
progress_percentage(uint64_t in_pos)285 progress_percentage(uint64_t in_pos)
286 {
287           // If the size of the input file is unknown or the size told us is
288           // clearly wrong since we have processed more data than the alleged
289           // size of the file, show a static string indicating that we have
290           // no idea of the completion percentage.
291           if (expected_in_size == 0 || in_pos > expected_in_size)
292                     return "--- %";
293 
294           // Never show 100.0 % before we actually are finished.
295           double percentage = (double)(in_pos) / (double)(expected_in_size)
296                               * 99.9;
297 
298           // Use big enough buffer to hold e.g. a multibyte decimal point.
299           static char buf[16];
300           snprintf(buf, sizeof(buf), "%.1f %%", percentage);
301 
302           return buf;
303 }
304 
305 
306 /// Make the string containing the amount of input processed, amount of
307 /// output produced, and the compression ratio.
308 static const char *
progress_sizes(uint64_t compressed_pos,uint64_t uncompressed_pos,bool final)309 progress_sizes(uint64_t compressed_pos, uint64_t uncompressed_pos, bool final)
310 {
311           // Use big enough buffer to hold e.g. a multibyte thousand separators.
312           static char buf[128];
313           char *pos = buf;
314           size_t left = sizeof(buf);
315 
316           // Print the sizes. If this the final message, use more reasonable
317           // units than MiB if the file was small.
318           const enum nicestr_unit unit_min = final ? NICESTR_B : NICESTR_MIB;
319           my_snprintf(&pos, &left, "%s / %s",
320                               uint64_to_nicestr(compressed_pos,
321                                         unit_min, NICESTR_TIB, false, 0),
322                               uint64_to_nicestr(uncompressed_pos,
323                                         unit_min, NICESTR_TIB, false, 1));
324 
325           // Avoid division by zero. If we cannot calculate the ratio, set
326           // it to some nice number greater than 10.0 so that it gets caught
327           // in the next if-clause.
328           const double ratio = uncompressed_pos > 0
329                               ? (double)(compressed_pos) / (double)(uncompressed_pos)
330                               : 16.0;
331 
332           // If the ratio is very bad, just indicate that it is greater than
333           // 9.999. This way the length of the ratio field stays fixed.
334           if (ratio > 9.999)
335                     snprintf(pos, left, " > %.3f", 9.999);
336           else
337                     snprintf(pos, left, " = %.3f", ratio);
338 
339           return buf;
340 }
341 
342 
343 /// Make the string containing the processing speed of uncompressed data.
344 static const char *
progress_speed(uint64_t uncompressed_pos,uint64_t elapsed)345 progress_speed(uint64_t uncompressed_pos, uint64_t elapsed)
346 {
347           // Don't print the speed immediately, since the early values look
348           // somewhat random.
349           if (elapsed < 3000)
350                     return "";
351 
352           static const char unit[][8] = {
353                     "KiB/s",
354                     "MiB/s",
355                     "GiB/s",
356           };
357 
358           size_t unit_index = 0;
359 
360           // Calculate the speed as KiB/s.
361           double speed = (double)(uncompressed_pos)
362                               / ((double)(elapsed) * (1024.0 / 1000.0));
363 
364           // Adjust the unit of the speed if needed.
365           while (speed > 999.0) {
366                     speed /= 1024.0;
367                     if (++unit_index == ARRAY_SIZE(unit))
368                               return ""; // Way too fast ;-)
369           }
370 
371           // Use decimal point only if the number is small. Examples:
372           //  - 0.1 KiB/s
373           //  - 9.9 KiB/s
374           //  - 99 KiB/s
375           //  - 999 KiB/s
376           // Use big enough buffer to hold e.g. a multibyte decimal point.
377           static char buf[16];
378           snprintf(buf, sizeof(buf), "%.*f %s",
379                               speed > 9.9 ? 0 : 1, speed, unit[unit_index]);
380           return buf;
381 }
382 
383 
384 /// Make a string indicating elapsed time. The format is either
385 /// M:SS or H:MM:SS depending on if the time is an hour or more.
386 static const char *
progress_time(uint64_t mseconds)387 progress_time(uint64_t mseconds)
388 {
389           // 9999 hours = 416 days
390           static char buf[sizeof("9999:59:59")];
391 
392           // 32-bit variable is enough for elapsed time (136 years).
393           uint32_t seconds = (uint32_t)(mseconds / 1000);
394 
395           // Don't show anything if the time is zero or ridiculously big.
396           if (seconds == 0 || seconds > ((9999 * 60) + 59) * 60 + 59)
397                     return "";
398 
399           uint32_t minutes = seconds / 60;
400           seconds %= 60;
401 
402           if (minutes >= 60) {
403                     const uint32_t hours = minutes / 60;
404                     minutes %= 60;
405                     snprintf(buf, sizeof(buf),
406                                         "%" PRIu32 ":%02" PRIu32 ":%02" PRIu32,
407                                         hours, minutes, seconds);
408           } else {
409                     snprintf(buf, sizeof(buf), "%" PRIu32 ":%02" PRIu32,
410                                         minutes, seconds);
411           }
412 
413           return buf;
414 }
415 
416 
417 /// Return a string containing estimated remaining time when
418 /// reasonably possible.
419 static const char *
progress_remaining(uint64_t in_pos,uint64_t elapsed)420 progress_remaining(uint64_t in_pos, uint64_t elapsed)
421 {
422           // Don't show the estimated remaining time when it wouldn't
423           // make sense:
424           //  - Input size is unknown.
425           //  - Input has grown bigger since we started (de)compressing.
426           //  - We haven't processed much data yet, so estimate would be
427           //    too inaccurate.
428           //  - Only a few seconds has passed since we started (de)compressing,
429           //    so estimate would be too inaccurate.
430           if (expected_in_size == 0 || in_pos > expected_in_size
431                               || in_pos < (UINT64_C(1) << 19) || elapsed < 8000)
432                     return "";
433 
434           // Calculate the estimate. Don't give an estimate of zero seconds,
435           // since it is possible that all the input has been already passed
436           // to the library, but there is still quite a bit of output pending.
437           uint32_t remaining = (double)(expected_in_size - in_pos)
438                               * ((double)(elapsed) / 1000.0) / (double)(in_pos);
439           if (remaining < 1)
440                     remaining = 1;
441 
442           static char buf[sizeof("9 h 55 min")];
443 
444           // Select appropriate precision for the estimated remaining time.
445           if (remaining <= 10) {
446                     // A maximum of 10 seconds remaining.
447                     // Show the number of seconds as is.
448                     snprintf(buf, sizeof(buf), "%" PRIu32 " s", remaining);
449 
450           } else if (remaining <= 50) {
451                     // A maximum of 50 seconds remaining.
452                     // Round up to the next multiple of five seconds.
453                     remaining = (remaining + 4) / 5 * 5;
454                     snprintf(buf, sizeof(buf), "%" PRIu32 " s", remaining);
455 
456           } else if (remaining <= 590) {
457                     // A maximum of 9 minutes and 50 seconds remaining.
458                     // Round up to the next multiple of ten seconds.
459                     remaining = (remaining + 9) / 10 * 10;
460                     snprintf(buf, sizeof(buf), "%" PRIu32 " min %" PRIu32 " s",
461                                         remaining / 60, remaining % 60);
462 
463           } else if (remaining <= 59 * 60) {
464                     // A maximum of 59 minutes remaining.
465                     // Round up to the next multiple of a minute.
466                     remaining = (remaining + 59) / 60;
467                     snprintf(buf, sizeof(buf), "%" PRIu32 " min", remaining);
468 
469           } else if (remaining <= 9 * 3600 + 50 * 60) {
470                     // A maximum of 9 hours and 50 minutes left.
471                     // Round up to the next multiple of ten minutes.
472                     remaining = (remaining + 599) / 600 * 10;
473                     snprintf(buf, sizeof(buf), "%" PRIu32 " h %" PRIu32 " min",
474                                         remaining / 60, remaining % 60);
475 
476           } else if (remaining <= 23 * 3600) {
477                     // A maximum of 23 hours remaining.
478                     // Round up to the next multiple of an hour.
479                     remaining = (remaining + 3599) / 3600;
480                     snprintf(buf, sizeof(buf), "%" PRIu32 " h", remaining);
481 
482           } else if (remaining <= 9 * 24 * 3600 + 23 * 3600) {
483                     // A maximum of 9 days and 23 hours remaining.
484                     // Round up to the next multiple of an hour.
485                     remaining = (remaining + 3599) / 3600;
486                     snprintf(buf, sizeof(buf), "%" PRIu32 " d %" PRIu32 " h",
487                                         remaining / 24, remaining % 24);
488 
489           } else if (remaining <= 999 * 24 * 3600) {
490                     // A maximum of 999 days remaining. ;-)
491                     // Round up to the next multiple of a day.
492                     remaining = (remaining + 24 * 3600 - 1) / (24 * 3600);
493                     snprintf(buf, sizeof(buf), "%" PRIu32 " d", remaining);
494 
495           } else {
496                     // The estimated remaining time is too big. Don't show it.
497                     return "";
498           }
499 
500           return buf;
501 }
502 
503 
504 /// Get how much uncompressed and compressed data has been processed.
505 static void
progress_pos(uint64_t * in_pos,uint64_t * compressed_pos,uint64_t * uncompressed_pos)506 progress_pos(uint64_t *in_pos,
507                     uint64_t *compressed_pos, uint64_t *uncompressed_pos)
508 {
509           uint64_t out_pos;
510           lzma_get_progress(progress_strm, in_pos, &out_pos);
511 
512           // It cannot have processed more input than it has been given.
513           assert(*in_pos <= progress_strm->total_in);
514 
515           // It cannot have produced more output than it claims to have ready.
516           assert(out_pos >= progress_strm->total_out);
517 
518           if (opt_mode == MODE_COMPRESS) {
519                     *compressed_pos = out_pos;
520                     *uncompressed_pos = *in_pos;
521           } else {
522                     *compressed_pos = *in_pos;
523                     *uncompressed_pos = out_pos;
524           }
525 
526           return;
527 }
528 
529 
530 extern void
message_progress_update(void)531 message_progress_update(void)
532 {
533           if (!progress_needs_updating)
534                     return;
535 
536           // Calculate how long we have been processing this file.
537           const uint64_t elapsed = mytime_get_elapsed();
538 
539 #ifndef SIGALRM
540           if (progress_next_update > elapsed)
541                     return;
542 
543           progress_next_update = elapsed + 1000;
544 #endif
545 
546           // Get our current position in the stream.
547           uint64_t in_pos;
548           uint64_t compressed_pos;
549           uint64_t uncompressed_pos;
550           progress_pos(&in_pos, &compressed_pos, &uncompressed_pos);
551 
552           // Block signals so that fprintf() doesn't get interrupted.
553           signals_block();
554 
555           // Print the filename if it hasn't been printed yet.
556           if (!current_filename_printed)
557                     print_filename();
558 
559           // Print the actual progress message. The idea is that there is at
560           // least three spaces between the fields in typical situations, but
561           // even in rare situations there is at least one space.
562           const char *cols[5] = {
563                     progress_percentage(in_pos),
564                     progress_sizes(compressed_pos, uncompressed_pos, false),
565                     progress_speed(uncompressed_pos, elapsed),
566                     progress_time(elapsed),
567                     progress_remaining(in_pos, elapsed),
568           };
569           fprintf(stderr, "\r %*s %*s   %*s %10s   %10s\r",
570                               tuklib_mbstr_fw(cols[0], 6), cols[0],
571                               tuklib_mbstr_fw(cols[1], 35), cols[1],
572                               tuklib_mbstr_fw(cols[2], 9), cols[2],
573                               cols[3],
574                               cols[4]);
575 
576 #ifdef SIGALRM
577           // Updating the progress info was finished. Reset
578           // progress_needs_updating to wait for the next SIGALRM.
579           //
580           // NOTE: This has to be done before alarm(1) or with (very) bad
581           // luck we could be setting this to false after the alarm has already
582           // been triggered.
583           progress_needs_updating = false;
584 
585           if (verbosity >= V_VERBOSE && progress_automatic) {
586                     // Mark that the progress indicator is active, so if an error
587                     // occurs, the error message gets printed cleanly.
588                     progress_active = true;
589 
590                     // Restart the timer so that progress_needs_updating gets
591                     // set to true after about one second.
592                     alarm(1);
593           } else {
594                     // The progress message was printed because user had sent us
595                     // SIGALRM. In this case, each progress message is printed
596                     // on its own line.
597                     fputc('\n', stderr);
598           }
599 #else
600           // When SIGALRM isn't supported and we get here, it's always due to
601           // automatic progress update. We set progress_active here too like
602           // described above.
603           assert(verbosity >= V_VERBOSE);
604           assert(progress_automatic);
605           progress_active = true;
606 #endif
607 
608           signals_unblock();
609 
610           return;
611 }
612 
613 
614 static void
progress_flush(bool finished)615 progress_flush(bool finished)
616 {
617           if (!progress_started || verbosity < V_VERBOSE)
618                     return;
619 
620           uint64_t in_pos;
621           uint64_t compressed_pos;
622           uint64_t uncompressed_pos;
623           progress_pos(&in_pos, &compressed_pos, &uncompressed_pos);
624 
625           // Avoid printing intermediate progress info if some error occurs
626           // in the beginning of the stream. (If something goes wrong later in
627           // the stream, it is sometimes useful to tell the user where the
628           // error approximately occurred, especially if the error occurs
629           // after a time-consuming operation.)
630           if (!finished && !progress_active
631                               && (compressed_pos == 0 || uncompressed_pos == 0))
632                     return;
633 
634           progress_active = false;
635 
636           const uint64_t elapsed = mytime_get_elapsed();
637 
638           signals_block();
639 
640           // When using the auto-updating progress indicator, the final
641           // statistics are printed in the same format as the progress
642           // indicator itself.
643           if (progress_automatic) {
644                     const char *cols[5] = {
645                               finished ? "100 %" : progress_percentage(in_pos),
646                               progress_sizes(compressed_pos, uncompressed_pos, true),
647                               progress_speed(uncompressed_pos, elapsed),
648                               progress_time(elapsed),
649                               finished ? "" : progress_remaining(in_pos, elapsed),
650                     };
651                     fprintf(stderr, "\r %*s %*s   %*s %10s   %10s\n",
652                                         tuklib_mbstr_fw(cols[0], 6), cols[0],
653                                         tuklib_mbstr_fw(cols[1], 35), cols[1],
654                                         tuklib_mbstr_fw(cols[2], 9), cols[2],
655                                         cols[3],
656                                         cols[4]);
657           } else {
658                     // The filename is always printed.
659                     fprintf(stderr, "%s: ", filename);
660 
661                     // Percentage is printed only if we didn't finish yet.
662                     if (!finished) {
663                               // Don't print the percentage when it isn't known
664                               // (starts with a dash).
665                               const char *percentage = progress_percentage(in_pos);
666                               if (percentage[0] != '-')
667                                         fprintf(stderr, "%s, ", percentage);
668                     }
669 
670                     // Size information is always printed.
671                     fprintf(stderr, "%s", progress_sizes(
672                                         compressed_pos, uncompressed_pos, true));
673 
674                     // The speed and elapsed time aren't always shown.
675                     const char *speed = progress_speed(uncompressed_pos, elapsed);
676                     if (speed[0] != '\0')
677                               fprintf(stderr, ", %s", speed);
678 
679                     const char *elapsed_str = progress_time(elapsed);
680                     if (elapsed_str[0] != '\0')
681                               fprintf(stderr, ", %s", elapsed_str);
682 
683                     fputc('\n', stderr);
684           }
685 
686           signals_unblock();
687 
688           return;
689 }
690 
691 
692 extern void
message_progress_end(bool success)693 message_progress_end(bool success)
694 {
695           assert(progress_started);
696           progress_flush(success);
697           progress_started = false;
698           return;
699 }
700 
701 
702 static void
vmessage(enum message_verbosity v,const char * fmt,va_list ap)703 vmessage(enum message_verbosity v, const char *fmt, va_list ap)
704 {
705           if (v <= verbosity) {
706                     signals_block();
707 
708                     progress_flush(false);
709 
710                     // TRANSLATORS: This is the program name in the beginning
711                     // of the line in messages. Usually it becomes "xz: ".
712                     // This is a translatable string because French needs
713                     // a space before a colon.
714                     fprintf(stderr, _("%s: "), progname);
715                     vfprintf(stderr, fmt, ap);
716                     fputc('\n', stderr);
717 
718                     signals_unblock();
719           }
720 
721           return;
722 }
723 
724 
725 extern void
message(enum message_verbosity v,const char * fmt,...)726 message(enum message_verbosity v, const char *fmt, ...)
727 {
728           va_list ap;
729           va_start(ap, fmt);
730           vmessage(v, fmt, ap);
731           va_end(ap);
732           return;
733 }
734 
735 
736 extern void
message_warning(const char * fmt,...)737 message_warning(const char *fmt, ...)
738 {
739           va_list ap;
740           va_start(ap, fmt);
741           vmessage(V_WARNING, fmt, ap);
742           va_end(ap);
743 
744           set_exit_status(E_WARNING);
745           return;
746 }
747 
748 
749 extern void
message_error(const char * fmt,...)750 message_error(const char *fmt, ...)
751 {
752           va_list ap;
753           va_start(ap, fmt);
754           vmessage(V_ERROR, fmt, ap);
755           va_end(ap);
756 
757           set_exit_status(E_ERROR);
758           return;
759 }
760 
761 
762 extern void
message_fatal(const char * fmt,...)763 message_fatal(const char *fmt, ...)
764 {
765           va_list ap;
766           va_start(ap, fmt);
767           vmessage(V_ERROR, fmt, ap);
768           va_end(ap);
769 
770           tuklib_exit(E_ERROR, E_ERROR, false);
771 }
772 
773 
774 extern void
message_bug(void)775 message_bug(void)
776 {
777           message_fatal(_("Internal error (bug)"));
778 }
779 
780 
781 extern void
message_signal_handler(void)782 message_signal_handler(void)
783 {
784           message_fatal(_("Cannot establish signal handlers"));
785 }
786 
787 
788 extern const char *
message_strm(lzma_ret code)789 message_strm(lzma_ret code)
790 {
791           switch (code) {
792           case LZMA_NO_CHECK:
793                     return _("No integrity check; not verifying file integrity");
794 
795           case LZMA_UNSUPPORTED_CHECK:
796                     return _("Unsupported type of integrity check; "
797                                         "not verifying file integrity");
798 
799           case LZMA_MEM_ERROR:
800                     return strerror(ENOMEM);
801 
802           case LZMA_MEMLIMIT_ERROR:
803                     return _("Memory usage limit reached");
804 
805           case LZMA_FORMAT_ERROR:
806                     return _("File format not recognized");
807 
808           case LZMA_OPTIONS_ERROR:
809                     return _("Unsupported options");
810 
811           case LZMA_DATA_ERROR:
812                     return _("Compressed data is corrupt");
813 
814           case LZMA_BUF_ERROR:
815                     return _("Unexpected end of input");
816 
817           case LZMA_OK:
818           case LZMA_STREAM_END:
819           case LZMA_GET_CHECK:
820           case LZMA_PROG_ERROR:
821                     // Without "default", compiler will warn if new constants
822                     // are added to lzma_ret, it is not too easy to forget to
823                     // add the new constants to this function.
824                     break;
825           }
826 
827           return _("Internal error (bug)");
828 }
829 
830 
831 extern void
message_mem_needed(enum message_verbosity v,uint64_t memusage)832 message_mem_needed(enum message_verbosity v, uint64_t memusage)
833 {
834           if (v > verbosity)
835                     return;
836 
837           // Convert memusage to MiB, rounding up to the next full MiB.
838           // This way the user can always use the displayed usage as
839           // the new memory usage limit. (If we rounded to the nearest,
840           // the user might need to +1 MiB to get high enough limit.)
841           memusage = round_up_to_mib(memusage);
842 
843           uint64_t memlimit = hardware_memlimit_get(opt_mode);
844 
845           // Handle the case when there is no memory usage limit.
846           // This way we don't print a weird message with a huge number.
847           if (memlimit == UINT64_MAX) {
848                     message(v, _("%s MiB of memory is required. "
849                                         "The limiter is disabled."),
850                                         uint64_to_str(memusage, 0));
851                     return;
852           }
853 
854           // With US-ASCII:
855           // 2^64 with thousand separators + " MiB" suffix + '\0' = 26 + 4 + 1
856           // But there may be multibyte chars so reserve enough space.
857           char memlimitstr[128];
858 
859           // Show the memory usage limit as MiB unless it is less than 1 MiB.
860           // This way it's easy to notice errors where one has typed
861           // --memory=123 instead of --memory=123MiB.
862           if (memlimit < (UINT32_C(1) << 20)) {
863                     snprintf(memlimitstr, sizeof(memlimitstr), "%s B",
864                                         uint64_to_str(memlimit, 1));
865           } else {
866                     // Round up just like with memusage. If this function is
867                     // called for informational purposes (to just show the
868                     // current usage and limit), we should never show that
869                     // the usage is higher than the limit, which would give
870                     // a false impression that the memory usage limit isn't
871                     // properly enforced.
872                     snprintf(memlimitstr, sizeof(memlimitstr), "%s MiB",
873                                         uint64_to_str(round_up_to_mib(memlimit), 1));
874           }
875 
876           message(v, _("%s MiB of memory is required. The limit is %s."),
877                               uint64_to_str(memusage, 0), memlimitstr);
878 
879           return;
880 }
881 
882 
883 /// \brief      Convert uint32_t to a nice string for --lzma[12]=dict=SIZE
884 ///
885 /// The idea is to use KiB or MiB suffix when possible.
886 static const char *
uint32_to_optstr(uint32_t num)887 uint32_to_optstr(uint32_t num)
888 {
889           static char buf[16];
890 
891           if ((num & ((UINT32_C(1) << 20) - 1)) == 0)
892                     snprintf(buf, sizeof(buf), "%" PRIu32 "MiB", num >> 20);
893           else if ((num & ((UINT32_C(1) << 10) - 1)) == 0)
894                     snprintf(buf, sizeof(buf), "%" PRIu32 "KiB", num >> 10);
895           else
896                     snprintf(buf, sizeof(buf), "%" PRIu32, num);
897 
898           return buf;
899 }
900 
901 
902 extern void
message_filters_to_str(char buf[FILTERS_STR_SIZE],const lzma_filter * filters,bool all_known)903 message_filters_to_str(char buf[FILTERS_STR_SIZE],
904                     const lzma_filter *filters, bool all_known)
905 {
906           char *pos = buf;
907           size_t left = FILTERS_STR_SIZE;
908 
909           for (size_t i = 0; filters[i].id != LZMA_VLI_UNKNOWN; ++i) {
910                     // Add the dashes for the filter option. A space is
911                     // needed after the first and later filters.
912                     my_snprintf(&pos, &left, "%s", i == 0 ? "--" : " --");
913 
914                     switch (filters[i].id) {
915                     case LZMA_FILTER_LZMA1:
916                     case LZMA_FILTER_LZMA2: {
917                               const lzma_options_lzma *opt = filters[i].options;
918                               const char *mode = NULL;
919                               const char *mf = NULL;
920 
921                               if (all_known) {
922                                         switch (opt->mode) {
923                                         case LZMA_MODE_FAST:
924                                                   mode = "fast";
925                                                   break;
926 
927                                         case LZMA_MODE_NORMAL:
928                                                   mode = "normal";
929                                                   break;
930 
931                                         default:
932                                                   mode = "UNKNOWN";
933                                                   break;
934                                         }
935 
936                                         switch (opt->mf) {
937                                         case LZMA_MF_HC3:
938                                                   mf = "hc3";
939                                                   break;
940 
941                                         case LZMA_MF_HC4:
942                                                   mf = "hc4";
943                                                   break;
944 
945                                         case LZMA_MF_BT2:
946                                                   mf = "bt2";
947                                                   break;
948 
949                                         case LZMA_MF_BT3:
950                                                   mf = "bt3";
951                                                   break;
952 
953                                         case LZMA_MF_BT4:
954                                                   mf = "bt4";
955                                                   break;
956 
957                                         default:
958                                                   mf = "UNKNOWN";
959                                                   break;
960                                         }
961                               }
962 
963                               // Add the filter name and dictionary size, which
964                               // is always known.
965                               my_snprintf(&pos, &left, "lzma%c=dict=%s",
966                                                   filters[i].id == LZMA_FILTER_LZMA2
967                                                             ? '2' : '1',
968                                                   uint32_to_optstr(opt->dict_size));
969 
970                               // With LZMA1 also lc/lp/pb are known when
971                               // decompressing, but this function is never
972                               // used to print information about .lzma headers.
973                               assert(filters[i].id == LZMA_FILTER_LZMA2
974                                                   || all_known);
975 
976                               // Print the rest of the options, which are known
977                               // only when compressing.
978                               if (all_known)
979                                         my_snprintf(&pos, &left,
980                                                   ",lc=%" PRIu32 ",lp=%" PRIu32
981                                                   ",pb=%" PRIu32
982                                                   ",mode=%s,nice=%" PRIu32 ",mf=%s"
983                                                   ",depth=%" PRIu32,
984                                                   opt->lc, opt->lp, opt->pb,
985                                                   mode, opt->nice_len, mf, opt->depth);
986                               break;
987                     }
988 
989                     case LZMA_FILTER_X86:
990                     case LZMA_FILTER_POWERPC:
991                     case LZMA_FILTER_IA64:
992                     case LZMA_FILTER_ARM:
993                     case LZMA_FILTER_ARMTHUMB:
994                     case LZMA_FILTER_SPARC: {
995                               static const char bcj_names[][9] = {
996                                         "x86",
997                                         "powerpc",
998                                         "ia64",
999                                         "arm",
1000                                         "armthumb",
1001                                         "sparc",
1002                               };
1003 
1004                               const lzma_options_bcj *opt = filters[i].options;
1005                               my_snprintf(&pos, &left, "%s", bcj_names[filters[i].id
1006                                                   - LZMA_FILTER_X86]);
1007 
1008                               // Show the start offset only when really needed.
1009                               if (opt != NULL && opt->start_offset != 0)
1010                                         my_snprintf(&pos, &left, "=start=%" PRIu32,
1011                                                             opt->start_offset);
1012 
1013                               break;
1014                     }
1015 
1016                     case LZMA_FILTER_DELTA: {
1017                               const lzma_options_delta *opt = filters[i].options;
1018                               my_snprintf(&pos, &left, "delta=dist=%" PRIu32,
1019                                                   opt->dist);
1020                               break;
1021                     }
1022 
1023                     default:
1024                               // This should be possible only if liblzma is
1025                               // newer than the xz tool.
1026                               my_snprintf(&pos, &left, "UNKNOWN");
1027                               break;
1028                     }
1029           }
1030 
1031           return;
1032 }
1033 
1034 
1035 extern void
message_filters_show(enum message_verbosity v,const lzma_filter * filters)1036 message_filters_show(enum message_verbosity v, const lzma_filter *filters)
1037 {
1038           if (v > verbosity)
1039                     return;
1040 
1041           char buf[FILTERS_STR_SIZE];
1042           message_filters_to_str(buf, filters, true);
1043           fprintf(stderr, _("%s: Filter chain: %s\n"), progname, buf);
1044           return;
1045 }
1046 
1047 
1048 extern void
message_try_help(void)1049 message_try_help(void)
1050 {
1051           // Print this with V_WARNING instead of V_ERROR to prevent it from
1052           // showing up when --quiet has been specified.
1053           message(V_WARNING, _("Try `%s --help' for more information."),
1054                               progname);
1055           return;
1056 }
1057 
1058 
1059 extern void
message_version(void)1060 message_version(void)
1061 {
1062           // It is possible that liblzma version is different than the command
1063           // line tool version, so print both.
1064           if (opt_robot) {
1065                     printf("XZ_VERSION=%" PRIu32 "\nLIBLZMA_VERSION=%" PRIu32 "\n",
1066                                         LZMA_VERSION, lzma_version_number());
1067           } else {
1068                     printf("xz (" PACKAGE_NAME ") " LZMA_VERSION_STRING "\n");
1069                     printf("liblzma %s\n", lzma_version_string());
1070           }
1071 
1072           tuklib_exit(E_SUCCESS, E_ERROR, verbosity != V_SILENT);
1073 }
1074 
1075 
1076 extern void
message_help(bool long_help)1077 message_help(bool long_help)
1078 {
1079           printf(_("Usage: %s [OPTION]... [FILE]...\n"
1080                               "Compress or decompress FILEs in the .xz format.\n\n"),
1081                               progname);
1082 
1083           // NOTE: The short help doesn't currently have options that
1084           // take arguments.
1085           if (long_help)
1086                     puts(_("Mandatory arguments to long options are mandatory "
1087                                         "for short options too.\n"));
1088 
1089           if (long_help)
1090                     puts(_(" Operation mode:\n"));
1091 
1092           puts(_(
1093 "  -z, --compress      force compression\n"
1094 "  -d, --decompress    force decompression\n"
1095 "  -t, --test          test compressed file integrity\n"
1096 "  -l, --list          list information about .xz files"));
1097 
1098           if (long_help)
1099                     puts(_("\n Operation modifiers:\n"));
1100 
1101           puts(_(
1102 "  -k, --keep          keep (don't delete) input files\n"
1103 "  -f, --force         force overwrite of output file and (de)compress links\n"
1104 "  -c, --stdout        write to standard output and don't delete input files"));
1105 
1106           if (long_help) {
1107                     puts(_(
1108 "      --single-stream decompress only the first stream, and silently\n"
1109 "                      ignore possible remaining input data"));
1110                     puts(_(
1111 "      --no-sparse     do not create sparse files when decompressing\n"
1112 "  -S, --suffix=.SUF   use the suffix `.SUF' on compressed files\n"
1113 "      --files[=FILE]  read filenames to process from FILE; if FILE is\n"
1114 "                      omitted, filenames are read from the standard input;\n"
1115 "                      filenames must be terminated with the newline character\n"
1116 "      --files0[=FILE] like --files but use the null character as terminator"));
1117           }
1118 
1119           if (long_help) {
1120                     puts(_("\n Basic file format and compression options:\n"));
1121                     puts(_(
1122 "  -F, --format=FMT    file format to encode or decode; possible values are\n"
1123 "                      `auto' (default), `xz', `lzma', and `raw'\n"
1124 "  -C, --check=CHECK   integrity check type: `none' (use with caution),\n"
1125 "                      `crc32', `crc64' (default), or `sha256'"));
1126                     puts(_(
1127 "      --ignore-check  don't verify the integrity check when decompressing"));
1128           }
1129 
1130           puts(_(
1131 "  -0 ... -9           compression preset; default is 6; take compressor *and*\n"
1132 "                      decompressor memory usage into account before using 7-9!"));
1133 
1134           puts(_(
1135 "  -e, --extreme       try to improve compression ratio by using more CPU time;\n"
1136 "                      does not affect decompressor memory requirements"));
1137 
1138           puts(_(
1139 "  -T, --threads=NUM   use at most NUM threads; the default is 1; set to 0\n"
1140 "                      to use as many threads as there are processor cores"));
1141 
1142           if (long_help) {
1143                     puts(_(
1144 "      --block-size=SIZE\n"
1145 "                      start a new .xz block after every SIZE bytes of input;\n"
1146 "                      use this to set the block size for threaded compression"));
1147                     puts(_(
1148 "      --block-list=SIZES\n"
1149 "                      start a new .xz block after the given comma-separated\n"
1150 "                      intervals of uncompressed data"));
1151                     puts(_(
1152 "      --flush-timeout=TIMEOUT\n"
1153 "                      when compressing, if more than TIMEOUT milliseconds has\n"
1154 "                      passed since the previous flush and reading more input\n"
1155 "                      would block, all pending data is flushed out"
1156                     ));
1157                     puts(_( // xgettext:no-c-format
1158 "      --memlimit-compress=LIMIT\n"
1159 "      --memlimit-decompress=LIMIT\n"
1160 "  -M, --memlimit=LIMIT\n"
1161 "                      set memory usage limit for compression, decompression,\n"
1162 "                      or both; LIMIT is in bytes, % of RAM, or 0 for defaults"));
1163 
1164                     puts(_(
1165 "      --no-adjust     if compression settings exceed the memory usage limit,\n"
1166 "                      give an error instead of adjusting the settings downwards"));
1167           }
1168 
1169           if (long_help) {
1170                     puts(_(
1171 "\n Custom filter chain for compression (alternative for using presets):"));
1172 
1173 #if defined(HAVE_ENCODER_LZMA1) || defined(HAVE_DECODER_LZMA1) \
1174                     || defined(HAVE_ENCODER_LZMA2) || defined(HAVE_DECODER_LZMA2)
1175                     // TRANSLATORS: The word "literal" in "literal context bits"
1176                     // means how many "context bits" to use when encoding
1177                     // literals. A literal is a single 8-bit byte. It doesn't
1178                     // mean "literally" here.
1179                     puts(_(
1180 "\n"
1181 "  --lzma1[=OPTS]      LZMA1 or LZMA2; OPTS is a comma-separated list of zero or\n"
1182 "  --lzma2[=OPTS]      more of the following options (valid values; default):\n"
1183 "                        preset=PRE reset options to a preset (0-9[e])\n"
1184 "                        dict=NUM   dictionary size (4KiB - 1536MiB; 8MiB)\n"
1185 "                        lc=NUM     number of literal context bits (0-4; 3)\n"
1186 "                        lp=NUM     number of literal position bits (0-4; 0)\n"
1187 "                        pb=NUM     number of position bits (0-4; 2)\n"
1188 "                        mode=MODE  compression mode (fast, normal; normal)\n"
1189 "                        nice=NUM   nice length of a match (2-273; 64)\n"
1190 "                        mf=NAME    match finder (hc3, hc4, bt2, bt3, bt4; bt4)\n"
1191 "                        depth=NUM  maximum search depth; 0=automatic (default)"));
1192 #endif
1193 
1194                     puts(_(
1195 "\n"
1196 "  --x86[=OPTS]        x86 BCJ filter (32-bit and 64-bit)\n"
1197 "  --powerpc[=OPTS]    PowerPC BCJ filter (big endian only)\n"
1198 "  --ia64[=OPTS]       IA-64 (Itanium) BCJ filter\n"
1199 "  --arm[=OPTS]        ARM BCJ filter (little endian only)\n"
1200 "  --armthumb[=OPTS]   ARM-Thumb BCJ filter (little endian only)\n"
1201 "  --sparc[=OPTS]      SPARC BCJ filter\n"
1202 "                      Valid OPTS for all BCJ filters:\n"
1203 "                        start=NUM  start offset for conversions (default=0)"));
1204 
1205 #if defined(HAVE_ENCODER_DELTA) || defined(HAVE_DECODER_DELTA)
1206                     puts(_(
1207 "\n"
1208 "  --delta[=OPTS]      Delta filter; valid OPTS (valid values; default):\n"
1209 "                        dist=NUM   distance between bytes being subtracted\n"
1210 "                                   from each other (1-256; 1)"));
1211 #endif
1212           }
1213 
1214           if (long_help)
1215                     puts(_("\n Other options:\n"));
1216 
1217           puts(_(
1218 "  -q, --quiet         suppress warnings; specify twice to suppress errors too\n"
1219 "  -v, --verbose       be verbose; specify twice for even more verbose"));
1220 
1221           if (long_help) {
1222                     puts(_(
1223 "  -Q, --no-warn       make warnings not affect the exit status"));
1224                     puts(_(
1225 "      --robot         use machine-parsable messages (useful for scripts)"));
1226                     puts("");
1227                     puts(_(
1228 "      --info-memory   display the total amount of RAM and the currently active\n"
1229 "                      memory usage limits, and exit"));
1230                     puts(_(
1231 "  -h, --help          display the short help (lists only the basic options)\n"
1232 "  -H, --long-help     display this long help and exit"));
1233           } else {
1234                     puts(_(
1235 "  -h, --help          display this short help and exit\n"
1236 "  -H, --long-help     display the long help (lists also the advanced options)"));
1237           }
1238 
1239           puts(_(
1240 "  -V, --version       display the version number and exit"));
1241 
1242           puts(_("\nWith no FILE, or when FILE is -, read standard input.\n"));
1243 
1244           // TRANSLATORS: This message indicates the bug reporting address
1245           // for this package. Please add _another line_ saying
1246           // "Report translation bugs to <...>\n" with the email or WWW
1247           // address for translation bugs. Thanks.
1248           printf(_("Report bugs to <%s> (in English or Finnish).\n"),
1249                               PACKAGE_BUGREPORT);
1250           printf(_("%s home page: <%s>\n"), PACKAGE_NAME, PACKAGE_URL);
1251 
1252 #if LZMA_VERSION_STABILITY != LZMA_VERSION_STABILITY_STABLE
1253           puts(_(
1254 "THIS IS A DEVELOPMENT VERSION NOT INTENDED FOR PRODUCTION USE."));
1255 #endif
1256 
1257           tuklib_exit(E_SUCCESS, E_ERROR, verbosity != V_SILENT);
1258 }
1259