afdaeee7ed
We deal with the difference between binary and text modes on Windows by doing all I/O in binary mode (including, in particular, stdin/stdout/stderr) and by treating text mode as equivalent to binary mode (i.e. we use Unix line ending semantics). Change-Id: I76a46d8d02cd7efe1931c8272d8f2c311aef3acb Reviewed-on: https://boringssl-review.googlesource.com/3070 Reviewed-by: Adam Langley <agl@google.com>
478 lines
12 KiB
C++
478 lines
12 KiB
C++
/* Copyright (c) 2014, Google Inc.
|
||
*
|
||
* Permission to use, copy, modify, and/or distribute this software for any
|
||
* purpose with or without fee is hereby granted, provided that the above
|
||
* copyright notice and this permission notice appear in all copies.
|
||
*
|
||
* THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
|
||
* WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
|
||
* MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
|
||
* SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
|
||
* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION
|
||
* OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN
|
||
* CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. */
|
||
|
||
#include <openssl/base.h>
|
||
|
||
#include <memory>
|
||
#include <string>
|
||
#include <vector>
|
||
|
||
#include <errno.h>
|
||
#include <fcntl.h>
|
||
#include <limits.h>
|
||
#include <stdio.h>
|
||
#include <sys/stat.h>
|
||
#include <sys/types.h>
|
||
|
||
#if !defined(OPENSSL_WINDOWS)
|
||
#include <unistd.h>
|
||
#if !defined(O_BINARY)
|
||
#define O_BINARY 0
|
||
#endif
|
||
#else
|
||
#define NOMINMAX
|
||
#define WIN32_LEAN_AND_MEAN
|
||
#include <windows.h>
|
||
#include <io.h>
|
||
#define PATH_MAX MAX_PATH
|
||
#define read _read
|
||
#endif
|
||
|
||
#include <openssl/digest.h>
|
||
|
||
struct close_delete {
|
||
void operator()(int *fd) {
|
||
close(*fd);
|
||
}
|
||
};
|
||
|
||
template<typename T, typename R, R (*func) (T*)>
|
||
struct func_delete {
|
||
void operator()(T* obj) {
|
||
func(obj);
|
||
}
|
||
};
|
||
|
||
// Source is an awkward expression of a union type in C++: Stdin | File filename.
|
||
struct Source {
|
||
enum Type {
|
||
STDIN,
|
||
};
|
||
|
||
Source() : is_stdin_(false) {}
|
||
Source(Type) : is_stdin_(true) {}
|
||
Source(const std::string &name) : is_stdin_(false), filename_(name) {}
|
||
|
||
bool is_stdin() const { return is_stdin_; }
|
||
const std::string &filename() const { return filename_; }
|
||
|
||
private:
|
||
bool is_stdin_;
|
||
std::string filename_;
|
||
};
|
||
|
||
static const char kStdinName[] = "standard input";
|
||
|
||
// OpenFile opens the regular file named |filename| and sets |*out_fd| to be a
|
||
// file descriptor to it. Returns true on sucess or prints an error to stderr
|
||
// and returns false on error.
|
||
static bool OpenFile(int *out_fd, const std::string &filename) {
|
||
*out_fd = -1;
|
||
|
||
int fd = open(filename.c_str(), O_RDONLY | O_BINARY);
|
||
if (fd < 0) {
|
||
fprintf(stderr, "Failed to open input file '%s': %s\n", filename.c_str(),
|
||
strerror(errno));
|
||
return false;
|
||
}
|
||
|
||
#if !defined(OPENSSL_WINDOWS)
|
||
struct stat st;
|
||
if (fstat(fd, &st)) {
|
||
fprintf(stderr, "Failed to stat input file '%s': %s\n", filename.c_str(),
|
||
strerror(errno));
|
||
goto err;
|
||
}
|
||
|
||
if (!S_ISREG(st.st_mode)) {
|
||
fprintf(stderr, "%s: not a regular file\n", filename.c_str());
|
||
goto err;
|
||
}
|
||
#endif
|
||
|
||
*out_fd = fd;
|
||
return true;
|
||
|
||
err:
|
||
close(fd);
|
||
return false;
|
||
}
|
||
|
||
// SumFile hashes the contents of |source| with |md| and sets |*out_hex| to the
|
||
// hex-encoded result.
|
||
//
|
||
// It returns true on success or prints an error to stderr and returns false on
|
||
// error.
|
||
static bool SumFile(std::string *out_hex, const EVP_MD *md,
|
||
const Source &source) {
|
||
std::unique_ptr<int, close_delete> scoped_fd;
|
||
int fd;
|
||
|
||
if (source.is_stdin()) {
|
||
fd = 0;
|
||
} else {
|
||
if (!OpenFile(&fd, source.filename())) {
|
||
return false;
|
||
}
|
||
scoped_fd.reset(&fd);
|
||
}
|
||
|
||
static const size_t kBufSize = 8192;
|
||
std::unique_ptr<uint8_t[]> buf(new uint8_t[kBufSize]);
|
||
|
||
EVP_MD_CTX ctx;
|
||
EVP_MD_CTX_init(&ctx);
|
||
std::unique_ptr<EVP_MD_CTX, func_delete<EVP_MD_CTX, int, EVP_MD_CTX_cleanup>>
|
||
scoped_ctx(&ctx);
|
||
|
||
if (!EVP_DigestInit_ex(&ctx, md, NULL)) {
|
||
fprintf(stderr, "Failed to initialize EVP_MD_CTX.\n");
|
||
return false;
|
||
}
|
||
|
||
for (;;) {
|
||
ssize_t n;
|
||
|
||
do {
|
||
n = read(fd, buf.get(), kBufSize);
|
||
} while (n == -1 && errno == EINTR);
|
||
|
||
if (n == 0) {
|
||
break;
|
||
} else if (n < 0) {
|
||
fprintf(stderr, "Failed to read from %s: %s\n",
|
||
source.is_stdin() ? kStdinName : source.filename().c_str(),
|
||
strerror(errno));
|
||
return false;
|
||
}
|
||
|
||
if (!EVP_DigestUpdate(&ctx, buf.get(), n)) {
|
||
fprintf(stderr, "Failed to update hash.\n");
|
||
return false;
|
||
}
|
||
}
|
||
|
||
uint8_t digest[EVP_MAX_MD_SIZE];
|
||
unsigned digest_len;
|
||
if (!EVP_DigestFinal_ex(&ctx, digest, &digest_len)) {
|
||
fprintf(stderr, "Failed to finish hash.\n");
|
||
return false;
|
||
}
|
||
|
||
char hex_digest[EVP_MAX_MD_SIZE * 2];
|
||
static const char kHextable[] = "0123456789abcdef";
|
||
for (unsigned i = 0; i < digest_len; i++) {
|
||
const uint8_t b = digest[i];
|
||
hex_digest[i * 2] = kHextable[b >> 4];
|
||
hex_digest[i * 2 + 1] = kHextable[b & 0xf];
|
||
}
|
||
*out_hex = std::string(hex_digest, digest_len * 2);
|
||
|
||
return true;
|
||
}
|
||
|
||
// PrintFileSum hashes |source| with |md| and prints a line to stdout in the
|
||
// format of the coreutils *sum utilities. It returns true on success or prints
|
||
// an error to stderr and returns false on error.
|
||
static bool PrintFileSum(const EVP_MD *md, const Source &source) {
|
||
std::string hex_digest;
|
||
if (!SumFile(&hex_digest, md, source)) {
|
||
return false;
|
||
}
|
||
|
||
// TODO: When given "--binary" or "-b", we should print " *" instead of " "
|
||
// between the digest and the filename.
|
||
//
|
||
// MSYS and Cygwin md5sum default to binary mode by default, whereas other
|
||
// platforms' tools default to text mode by default. We default to text mode
|
||
// by default and consider text mode equivalent to binary mode (i.e. we
|
||
// always use Unix semantics, even on Windows), which means that our default
|
||
// output will differ from the MSYS and Cygwin tools' default output.
|
||
printf("%s %s\n", hex_digest.c_str(),
|
||
source.is_stdin() ? "-" : source.filename().c_str());
|
||
return true;
|
||
}
|
||
|
||
// CheckModeArguments contains arguments for the check mode. See the
|
||
// sha256sum(1) man page for details.
|
||
struct CheckModeArguments {
|
||
bool quiet = false;
|
||
bool status = false;
|
||
bool warn = false;
|
||
bool strict = false;
|
||
};
|
||
|
||
// Check reads lines from |source| where each line is in the format of the
|
||
// coreutils *sum utilities. It attempts to verify each hash by reading the
|
||
// file named in the line.
|
||
//
|
||
// It returns true if all files were verified and, if |args.strict|, no input
|
||
// lines had formatting errors. Otherwise it prints errors to stderr and
|
||
// returns false.
|
||
static bool Check(const CheckModeArguments &args, const EVP_MD *md,
|
||
const Source &source) {
|
||
std::unique_ptr<FILE, func_delete<FILE, int, fclose>> scoped_file;
|
||
FILE *file;
|
||
|
||
if (source.is_stdin()) {
|
||
file = stdin;
|
||
} else {
|
||
int fd;
|
||
if (!OpenFile(&fd, source.filename())) {
|
||
return false;
|
||
}
|
||
|
||
file = fdopen(fd, "rb");
|
||
if (!file) {
|
||
perror("fdopen");
|
||
close(fd);
|
||
return false;
|
||
}
|
||
|
||
scoped_file = std::unique_ptr<FILE, func_delete<FILE, int, fclose>>(file);
|
||
}
|
||
|
||
const size_t hex_size = EVP_MD_size(md) * 2;
|
||
char line[EVP_MAX_MD_SIZE * 2 + 2 /* spaces */ + PATH_MAX + 1 /* newline */ +
|
||
1 /* NUL */];
|
||
unsigned bad_lines = 0;
|
||
unsigned parsed_lines = 0;
|
||
unsigned error_lines = 0;
|
||
unsigned bad_hash_lines = 0;
|
||
unsigned line_no = 0;
|
||
bool ok = true;
|
||
bool draining_overlong_line = false;
|
||
|
||
for (;;) {
|
||
line_no++;
|
||
|
||
if (fgets(line, sizeof(line), file) == nullptr) {
|
||
if (feof(file)) {
|
||
break;
|
||
}
|
||
fprintf(stderr, "Error reading from input.\n");
|
||
return false;
|
||
}
|
||
|
||
size_t len = strlen(line);
|
||
|
||
if (draining_overlong_line) {
|
||
if (line[len - 1] == '\n') {
|
||
draining_overlong_line = false;
|
||
}
|
||
continue;
|
||
}
|
||
|
||
const bool overlong = line[len - 1] != '\n' && !feof(file);
|
||
|
||
if (len < hex_size + 2 /* spaces */ + 1 /* filename */ ||
|
||
line[hex_size] != ' ' ||
|
||
line[hex_size + 1] != ' ' ||
|
||
overlong) {
|
||
bad_lines++;
|
||
if (args.warn) {
|
||
fprintf(stderr, "%s: %u: improperly formatted line\n",
|
||
source.is_stdin() ? kStdinName : source.filename().c_str(), line_no);
|
||
}
|
||
if (args.strict) {
|
||
ok = false;
|
||
}
|
||
if (overlong) {
|
||
draining_overlong_line = true;
|
||
}
|
||
continue;
|
||
}
|
||
|
||
if (line[len - 1] == '\n') {
|
||
line[len - 1] = 0;
|
||
len--;
|
||
}
|
||
|
||
parsed_lines++;
|
||
|
||
// coreutils does not attempt to restrict relative or absolute paths in the
|
||
// input so nor does this code.
|
||
std::string calculated_hex_digest;
|
||
const std::string target_filename(&line[hex_size + 2]);
|
||
Source target_source;
|
||
if (target_filename == "-") {
|
||
// coreutils reads from stdin if the filename is "-".
|
||
target_source = Source(Source::STDIN);
|
||
} else {
|
||
target_source = Source(target_filename);
|
||
}
|
||
|
||
if (!SumFile(&calculated_hex_digest, md, target_source)) {
|
||
error_lines++;
|
||
ok = false;
|
||
continue;
|
||
}
|
||
|
||
if (calculated_hex_digest != std::string(line, hex_size)) {
|
||
bad_hash_lines++;
|
||
if (!args.status) {
|
||
printf("%s: FAILED\n", target_filename.c_str());
|
||
}
|
||
ok = false;
|
||
continue;
|
||
}
|
||
|
||
if (!args.quiet) {
|
||
printf("%s: OK\n", target_filename.c_str());
|
||
}
|
||
}
|
||
|
||
if (!args.status) {
|
||
if (bad_lines > 0 && parsed_lines > 0) {
|
||
fprintf(stderr, "WARNING: %u line%s improperly formatted\n", bad_lines,
|
||
bad_lines == 1 ? " is" : "s are");
|
||
}
|
||
if (error_lines > 0) {
|
||
fprintf(stderr, "WARNING: %u computed checksum(s) did NOT match\n",
|
||
error_lines);
|
||
}
|
||
}
|
||
|
||
if (parsed_lines == 0) {
|
||
fprintf(stderr, "%s: no properly formatted checksum lines found.\n",
|
||
source.is_stdin() ? kStdinName : source.filename().c_str());
|
||
ok = false;
|
||
}
|
||
|
||
return ok;
|
||
}
|
||
|
||
// DigestSum acts like the coreutils *sum utilites, with the given hash
|
||
// function.
|
||
static bool DigestSum(const EVP_MD *md,
|
||
const std::vector<std::string> &args) {
|
||
bool check_mode = false;
|
||
CheckModeArguments check_args;
|
||
bool check_mode_args_given = false;
|
||
std::vector<Source> sources;
|
||
|
||
auto it = args.begin();
|
||
while (it != args.end()) {
|
||
const std::string &arg = *it;
|
||
if (!arg.empty() && arg[0] != '-') {
|
||
break;
|
||
}
|
||
|
||
it++;
|
||
|
||
if (arg == "--") {
|
||
break;
|
||
}
|
||
|
||
if (arg == "-") {
|
||
// "-" ends the argument list and indicates that stdin should be used.
|
||
sources.push_back(Source(Source::STDIN));
|
||
break;
|
||
}
|
||
|
||
if (arg.size() >= 2 && arg[0] == '-' && arg[1] != '-') {
|
||
for (size_t i = 1; i < arg.size(); i++) {
|
||
switch (arg[i]) {
|
||
case 'b':
|
||
case 't':
|
||
// Binary/text mode – irrelevent, even on Windows.
|
||
break;
|
||
case 'c':
|
||
check_mode = true;
|
||
break;
|
||
case 'w':
|
||
check_mode_args_given = true;
|
||
check_args.warn = true;
|
||
break;
|
||
default:
|
||
fprintf(stderr, "Unknown option '%c'.\n", arg[i]);
|
||
return false;
|
||
}
|
||
}
|
||
} else if (arg == "--binary" || arg == "--text") {
|
||
// Binary/text mode – irrelevent, even on Windows.
|
||
} else if (arg == "--check") {
|
||
check_mode = true;
|
||
} else if (arg == "--quiet") {
|
||
check_mode_args_given = true;
|
||
check_args.quiet = true;
|
||
} else if (arg == "--status") {
|
||
check_mode_args_given = true;
|
||
check_args.status = true;
|
||
} else if (arg == "--warn") {
|
||
check_mode_args_given = true;
|
||
check_args.warn = true;
|
||
} else if (arg == "--strict") {
|
||
check_mode_args_given = true;
|
||
check_args.strict = true;
|
||
} else {
|
||
fprintf(stderr, "Unknown option '%s'.\n", arg.c_str());
|
||
return false;
|
||
}
|
||
}
|
||
|
||
if (check_mode_args_given && !check_mode) {
|
||
fprintf(
|
||
stderr,
|
||
"Check mode arguments are only meaningful when verifying checksums.\n");
|
||
return false;
|
||
}
|
||
|
||
for (; it != args.end(); it++) {
|
||
sources.push_back(Source(*it));
|
||
}
|
||
|
||
if (sources.empty()) {
|
||
sources.push_back(Source(Source::STDIN));
|
||
}
|
||
|
||
bool ok = true;
|
||
|
||
if (check_mode) {
|
||
for (auto &source : sources) {
|
||
ok &= Check(check_args, md, source);
|
||
}
|
||
} else {
|
||
for (auto &source : sources) {
|
||
ok &= PrintFileSum(md, source);
|
||
}
|
||
}
|
||
|
||
return ok;
|
||
}
|
||
|
||
bool MD5Sum(const std::vector<std::string> &args) {
|
||
return DigestSum(EVP_md5(), args);
|
||
}
|
||
|
||
bool SHA1Sum(const std::vector<std::string> &args) {
|
||
return DigestSum(EVP_sha1(), args);
|
||
}
|
||
|
||
bool SHA224Sum(const std::vector<std::string> &args) {
|
||
return DigestSum(EVP_sha224(), args);
|
||
}
|
||
|
||
bool SHA256Sum(const std::vector<std::string> &args) {
|
||
return DigestSum(EVP_sha256(), args);
|
||
}
|
||
|
||
bool SHA384Sum(const std::vector<std::string> &args) {
|
||
return DigestSum(EVP_sha384(), args);
|
||
}
|
||
|
||
bool SHA512Sum(const std::vector<std::string> &args) {
|
||
return DigestSum(EVP_sha512(), args);
|
||
}
|