304 lines
9.3 KiB
C
304 lines
9.3 KiB
C
/*
|
|
* Copyright(c) 2014-2018 Tim Ruehsen
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
* to deal in the Software without restriction, including without limitation
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice shall be included in
|
|
* all copies or substantial portions of the Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
|
|
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
|
* DEALINGS IN THE SOFTWARE.
|
|
*
|
|
* This file is part of libpsl.
|
|
*
|
|
* Using the libpsl functions via command line
|
|
*
|
|
* Changelog
|
|
* 11.04.2014 Tim Ruehsen created
|
|
*
|
|
*/
|
|
|
|
#if HAVE_CONFIG_H
|
|
# include <config.h>
|
|
#endif
|
|
|
|
#ifdef HAVE_UNISTD_H
|
|
# include <unistd.h>
|
|
#endif
|
|
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <ctype.h>
|
|
#include <locale.h>
|
|
|
|
#include <libpsl.h>
|
|
|
|
static void usage(int err, FILE* f)
|
|
{
|
|
fprintf(f, "Usage: psl [options] <domains...>\n");
|
|
fprintf(f, "\n");
|
|
fprintf(f, "Options:\n");
|
|
fprintf(f, " --version show library version information\n");
|
|
fprintf(f, " --use-latest-data use the latest PSL data available [default]\n");
|
|
fprintf(f, " --use-builtin-data use the builtin PSL data\n");
|
|
fprintf(f, " --no-star-rule do not apply the prevailing star rule\n");
|
|
fprintf(f, " (only applies to --is-public-suffix)\n");
|
|
fprintf(f, " --load-psl-file <filename> load PSL data from file\n");
|
|
fprintf(f, " --is-public-suffix check if domains are public suffixes [default]\n");
|
|
fprintf(f, " --is-cookie-domain-acceptable <cookie-domain>\n");
|
|
fprintf(f, " check if cookie-domain is acceptable for domains\n");
|
|
fprintf(f, " --print-unreg-domain print the longest public suffix part\n");
|
|
fprintf(f, " --print-reg-domain print the shortest private suffix part\n");
|
|
fprintf(f, " --print-info print info about library builtin data\n");
|
|
fprintf(f, " -b, --batch don't print leading domain\n");
|
|
fprintf(f, "\n");
|
|
|
|
exit(err);
|
|
}
|
|
|
|
/* RFC 2822-compliant date format */
|
|
static const char *time2str(time_t t)
|
|
{
|
|
static char buf[64];
|
|
struct tm *tp = localtime(&t);
|
|
|
|
strftime(buf, sizeof(buf), "%a, %d %b %Y %H:%M:%S %Z", tp);
|
|
return buf;
|
|
}
|
|
|
|
int main(int argc, const char *const *argv)
|
|
{
|
|
int mode = 1, no_star_rule = 0, batch_mode = 0;
|
|
const char *const *arg, *psl_file = NULL, *cookie_domain = NULL;
|
|
psl_ctx_t *psl = (psl_ctx_t *) psl_latest(NULL);
|
|
|
|
/* set current locale according to the environment variables */
|
|
setlocale(LC_ALL, "");
|
|
|
|
for (arg = argv + 1; arg < argv + argc; arg++) {
|
|
if (**arg == '-') {
|
|
if (!strcmp(*arg, "--is-public-suffix"))
|
|
mode = 1;
|
|
else if (!strcmp(*arg, "--print-unreg-domain"))
|
|
mode = 2;
|
|
else if (!strcmp(*arg, "--print-reg-domain"))
|
|
mode = 3;
|
|
else if (!strcmp(*arg, "--print-info"))
|
|
mode = 99;
|
|
else if (!strcmp(*arg, "--is-cookie-domain-acceptable") && arg < argv + argc - 1) {
|
|
mode = 4;
|
|
cookie_domain = *(++arg);
|
|
}
|
|
else if (!strcmp(*arg, "--use-latest-data")) {
|
|
psl_free(psl);
|
|
if (psl_file) {
|
|
fprintf(stderr, "Dropped data from %s\n", psl_file);
|
|
psl_file = NULL;
|
|
}
|
|
if (!(psl = (psl_ctx_t *) psl_latest(NULL)))
|
|
printf("No PSL data available\n");
|
|
}
|
|
else if (!strcmp(*arg, "--use-builtin-data")) {
|
|
psl_free(psl);
|
|
if (psl_file) {
|
|
fprintf(stderr, "Dropped data from %s\n", psl_file);
|
|
psl_file = NULL;
|
|
}
|
|
if (!(psl = (psl_ctx_t *) psl_builtin()))
|
|
printf("No builtin PSL data available\n");
|
|
}
|
|
else if (!strcmp(*arg, "--no-star-rule")) {
|
|
no_star_rule = 1;
|
|
}
|
|
else if (!strcmp(*arg, "--load-psl-file") && arg < argv + argc - 1) {
|
|
psl_free(psl);
|
|
if (psl_file) {
|
|
fprintf(stderr, "Dropped data from %s\n", psl_file);
|
|
psl_file = NULL;
|
|
}
|
|
if (!(psl = psl_load_file(psl_file = *(++arg)))) {
|
|
fprintf(stderr, "Failed to load PSL data from %s\n\n", psl_file);
|
|
psl_file = NULL;
|
|
}
|
|
}
|
|
else if (!strcmp(*arg, "--batch") || !strcmp(*arg, "-b")) {
|
|
batch_mode = 1;
|
|
}
|
|
else if (!strcmp(*arg, "--help")) {
|
|
fprintf(stdout, "`psl' explores the Public Suffix List\n\n");
|
|
usage(0, stdout);
|
|
}
|
|
else if (!strcmp(*arg, "--version")) {
|
|
printf("psl %s (0x%06x)\n", PACKAGE_VERSION, psl_check_version_number(0));
|
|
printf("libpsl %s\n", psl_get_version());
|
|
printf("\n");
|
|
printf("Copyright (C) 2014-2018 Tim Ruehsen\n");
|
|
printf("License: MIT\n");
|
|
exit(0);
|
|
}
|
|
else if (!strcmp(*arg, "--")) {
|
|
arg++;
|
|
break;
|
|
}
|
|
else {
|
|
fprintf(stderr, "Unknown option '%s'\n", *arg);
|
|
usage(1, stderr);
|
|
}
|
|
} else
|
|
break;
|
|
}
|
|
|
|
if (mode != 99) {
|
|
if (mode != 1 && no_star_rule) {
|
|
fprintf(stderr, "--no-star-rule only combines with --is-public-suffix\n");
|
|
usage(1, stderr);
|
|
}
|
|
if (!psl) {
|
|
fprintf(stderr, "No PSL data available - aborting\n");
|
|
exit(2);
|
|
}
|
|
if (arg >= argv + argc) {
|
|
char buf[256], *domain, *lower;
|
|
size_t len;
|
|
psl_error_t rc;
|
|
|
|
/* read URLs from STDIN */
|
|
while (fgets(buf, sizeof(buf), stdin)) {
|
|
for (domain = buf; isspace(*domain); domain++); /* skip leading spaces */
|
|
if (*domain == '#' || !*domain) continue; /* skip empty lines and comments */
|
|
for (len = strlen(domain); len && isspace(domain[len - 1]); len--); /* skip trailing spaces */
|
|
domain[len] = 0;
|
|
|
|
if ((rc = psl_str_to_utf8lower(domain, NULL, NULL, &lower)) != PSL_SUCCESS) {
|
|
fprintf(stderr, "%s: Failed to convert to lowercase UTF-8 (%d)\n", domain, rc);
|
|
continue;
|
|
}
|
|
|
|
if (!batch_mode && mode != 4)
|
|
printf("%s: ", domain);
|
|
|
|
if (mode == 1) {
|
|
if (no_star_rule)
|
|
printf("%d", psl_is_public_suffix2(psl, lower, PSL_TYPE_ANY|PSL_TYPE_NO_STAR_RULE));
|
|
else
|
|
printf("%d", psl_is_public_suffix(psl, lower));
|
|
|
|
if (!batch_mode)
|
|
printf(" (%s)\n", lower);
|
|
else
|
|
putchar('\n');
|
|
}
|
|
else if (mode == 2) {
|
|
const char *dom = psl_unregistrable_domain(psl, lower);
|
|
printf("%s\n", dom ? dom : "(null)");
|
|
}
|
|
else if (mode == 3) {
|
|
const char *dom = psl_registrable_domain(psl, lower);
|
|
printf("%s\n", dom ? dom : "(null)");
|
|
}
|
|
else if (mode == 4) {
|
|
char *cookie_domain_lower;
|
|
|
|
if ((rc = psl_str_to_utf8lower(domain, NULL, NULL, &cookie_domain_lower)) == PSL_SUCCESS) {
|
|
if (!batch_mode)
|
|
printf("%s: ", domain);
|
|
printf("%d\n", psl_is_cookie_domain_acceptable(psl, lower, cookie_domain));
|
|
free(cookie_domain_lower);
|
|
} else
|
|
fprintf(stderr, "%s: Failed to convert cookie domain '%s' to lowercase UTF-8 (%d)\n", domain, cookie_domain, rc);
|
|
}
|
|
|
|
psl_free_string(lower);
|
|
}
|
|
|
|
psl_free(psl);
|
|
exit(0);
|
|
}
|
|
}
|
|
|
|
if (mode == 1) {
|
|
for (; arg < argv + argc; arg++) {
|
|
if (!batch_mode)
|
|
printf("%s: ", *arg);
|
|
if (no_star_rule)
|
|
printf("%d\n", psl_is_public_suffix2(psl, *arg, PSL_TYPE_ANY|PSL_TYPE_NO_STAR_RULE));
|
|
else
|
|
printf("%d\n", psl_is_public_suffix(psl, *arg));
|
|
}
|
|
}
|
|
else if (mode == 2) {
|
|
for (; arg < argv + argc; arg++) {
|
|
const char *dom = psl_unregistrable_domain(psl, *arg);
|
|
if (!batch_mode)
|
|
printf("%s: ", *arg);
|
|
printf("%s\n", dom ? dom : "(null)");
|
|
}
|
|
}
|
|
else if (mode == 3) {
|
|
for (; arg < argv + argc; arg++) {
|
|
const char *dom = psl_registrable_domain(psl, *arg);
|
|
if (!batch_mode)
|
|
printf("%s: ", *arg);
|
|
printf("%s\n", dom ? dom : "(null)");
|
|
}
|
|
}
|
|
else if (mode == 4) {
|
|
for (; arg < argv + argc; arg++) {
|
|
if (!batch_mode)
|
|
printf("%s: ", *arg);
|
|
printf("%d\n", psl_is_cookie_domain_acceptable(psl, *arg, cookie_domain));
|
|
}
|
|
}
|
|
else if (mode == 99) {
|
|
printf("dist filename: %s\n", psl_dist_filename());
|
|
|
|
if (psl && psl != psl_builtin()) {
|
|
static char not_avail[] = "- information not available -";
|
|
int n;
|
|
|
|
if ((n = psl_suffix_count(psl)) >= 0)
|
|
printf("suffixes: %d\n", n);
|
|
else
|
|
printf("suffixes: %s\n", not_avail);
|
|
|
|
if ((n = psl_suffix_exception_count(psl)) >= 0)
|
|
printf("exceptions: %d\n", n);
|
|
else
|
|
printf("exceptions: %s\n", not_avail);
|
|
|
|
if ((n = psl_suffix_wildcard_count(psl)) >= 0)
|
|
printf("wildcards: %d\n", n);
|
|
else
|
|
printf("wildcards: %s\n", not_avail);
|
|
}
|
|
|
|
psl_free(psl);
|
|
psl = (psl_ctx_t *) psl_builtin();
|
|
|
|
if (psl) {
|
|
printf("builtin suffixes: %d\n", psl_suffix_count(psl));
|
|
printf("builtin exceptions: %d\n", psl_suffix_exception_count(psl));
|
|
printf("builtin wildcards: %d\n", psl_suffix_wildcard_count(psl));
|
|
printf("builtin filename: %s\n", psl_builtin_filename());
|
|
printf("builtin file time: %ld (%s)\n", (long) psl_builtin_file_time(), time2str(psl_builtin_file_time()));
|
|
printf("builtin SHA1 file hash: %s\n", psl_builtin_sha1sum());
|
|
printf("builtin outdated: %d\n", psl_builtin_outdated());
|
|
} else
|
|
printf("No builtin PSL data available\n");
|
|
}
|
|
|
|
psl_free(psl);
|
|
|
|
return 0;
|
|
}
|