229 lines
7.3 KiB
C
229 lines
7.3 KiB
C
/*
 * Copyright(c) 2014 Tim Ruehsen
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 * DEALINGS IN THE SOFTWARE.
 *
 * This file is part of libpsl.
 *
 * Using the libpsl functions via command line
 *
 * Changelog
 * 11.04.2014  Tim Ruehsen  created
 *
 */
|
|
|
|
#if HAVE_CONFIG_H
|
|
# include <config.h>
|
|
#endif
|
|
|
|
#include <ctype.h>
#include <locale.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <time.h>
#include <unistd.h>

#ifdef WITH_LIBICU
# include <unicode/uloc.h>
# include <unicode/ucnv.h>
#endif

#include <libpsl.h>
|
|
|
|
/*
 * Print the command line help to the stream `f` and terminate the process
 * with exit status `err`. This function does not return.
 *
 * Callers pass stdout with status 0 for --help and stderr with status 1
 * for an unknown option.
 */
static void usage(int err, FILE* f)
{
	/* One literal, written with a single call; the text contains no '%'. */
	static const char help_text[] =
		"Usage: psl [options] <domains...>\n"
		"\n"
		"Options:\n"
		" --version show library version information\n"
		" --use-builtin-data use the builtin PSL data [default]\n"
		" --load-psl-file <filename> load PSL data from file\n"
		" --is-public-suffix check if domains are public suffixes [default]\n"
		" --is-cookie-domain-acceptable <cookie-domain>\n"
		" check if cookie-domain is acceptable for domains\n"
		" --print-unreg-domain print the longest public suffix part\n"
		" --print-reg-domain print the shortest private suffix part\n"
		" --print-info print info about library builtin data\n"
		"\n";

	fputs(help_text, f);

	exit(err);
}
|
|
|
|
/*
 * Format `t` as local time using an RFC 2822-like layout
 * ("%a, %d %b %Y %H:%M:%S %Z").
 *
 * The zone is printed with %Z (zone name or abbreviation), not as the
 * numeric offset RFC 2822 prescribes, and the day and month names follow
 * the current locale.
 *
 * Returns a pointer to a static buffer that is overwritten by the next
 * call. The buffer holds an empty string if `t` cannot be converted or the
 * formatted text does not fit.
 */
static const char *time2str(time_t t)
{
	static char buf[64];
	const struct tm *tp = localtime(&t);

	/*
	 * localtime() returns NULL for a time it cannot represent, and
	 * strftime() returns 0 (leaving the buffer contents unspecified) when
	 * the result does not fit. Hand back a well-defined empty string then.
	 */
	if (!tp || strftime(buf, sizeof(buf), "%a, %d %b %Y %H:%M:%S %Z", tp) == 0)
		buf[0] = '\0';

	return buf;
}
|
|
|
|
int main(int argc, const char *const *argv)
|
|
{
|
|
int mode = 1;
|
|
const char *const *arg, *psl_file = NULL, *cookie_domain = NULL;
|
|
psl_ctx_t *psl = (psl_ctx_t *) psl_builtin();
|
|
|
|
/* set current locale according to the environment variables */
|
|
#include <locale.h>
|
|
setlocale(LC_ALL, "");
|
|
|
|
for (arg = argv + 1; arg < argv + argc; arg++) {
|
|
if (!strncmp(*arg, "--", 2)) {
|
|
if (!strcmp(*arg, "--is-public-suffix"))
|
|
mode = 1;
|
|
else if (!strcmp(*arg, "--print-unreg-domain"))
|
|
mode = 2;
|
|
else if (!strcmp(*arg, "--print-reg-domain"))
|
|
mode = 3;
|
|
else if (!strcmp(*arg, "--print-info"))
|
|
mode = 99;
|
|
else if (!strcmp(*arg, "--is-cookie-domain-acceptable") && arg < argv + argc - 1) {
|
|
mode = 4;
|
|
cookie_domain = *(++arg);
|
|
}
|
|
else if (!strcmp(*arg, "--use-builtin-data")) {
|
|
psl_free(psl);
|
|
if (psl_file) {
|
|
fprintf(stderr, "Dropped data from %s\n", psl_file);
|
|
psl_file = NULL;
|
|
}
|
|
if (!(psl = (psl_ctx_t *) psl_builtin()))
|
|
printf("No builtin PSL data available\n");
|
|
}
|
|
else if (!strcmp(*arg, "--load-psl-file") && arg < argv + argc - 1) {
|
|
psl_free(psl);
|
|
if (psl_file) {
|
|
fprintf(stderr, "Dropped data from %s\n", psl_file);
|
|
psl_file = NULL;
|
|
}
|
|
if (!(psl = psl_load_file(psl_file = *(++arg)))) {
|
|
fprintf(stderr, "Failed to load PSL data from %s\n\n", psl_file);
|
|
psl_file = NULL;
|
|
}
|
|
}
|
|
else if (!strcmp(*arg, "--help")) {
|
|
fprintf(stdout, "`psl' explores the Public Suffix List\n\n");
|
|
usage(0, stdout);
|
|
}
|
|
else if (!strcmp(*arg, "--version")) {
|
|
printf("psl %s\n", PACKAGE_VERSION);
|
|
printf("libpsl %s\n", psl_get_version());
|
|
printf("\n");
|
|
printf("Copyright (C) 2014 Tim Ruehsen\n");
|
|
printf("License: MIT\n");
|
|
exit(0);
|
|
}
|
|
else if (!strcmp(*arg, "--")) {
|
|
arg++;
|
|
break;
|
|
}
|
|
else {
|
|
fprintf(stderr, "Unknown option '%s'\n", *arg);
|
|
usage(1, stderr);
|
|
}
|
|
} else
|
|
break;
|
|
}
|
|
|
|
if (mode != 99) {
|
|
if (!psl) {
|
|
fprintf(stderr, "No PSL data available - aborting\n");
|
|
exit(2);
|
|
}
|
|
if (arg >= argv + argc) {
|
|
char buf[256], *domain, *lower;
|
|
size_t len;
|
|
int rc;
|
|
|
|
// read URLs from STDIN
|
|
while (fgets(buf, sizeof(buf), stdin)) {
|
|
for (domain = buf; isspace(*domain); domain++); // skip leading spaces
|
|
if (*domain == '#' || !*domain) continue; // skip empty lines and comments
|
|
for (len = strlen(domain); len && isspace(domain[len - 1]); len--); // skip trailing spaces
|
|
domain[len] = 0;
|
|
|
|
if ((rc = psl_str_to_utf8lower(domain, NULL, NULL, &lower)) != 0)
|
|
fprintf(stderr, "%s: Failed to convert to lowercase UTF-8 (%d)\n", domain, rc);
|
|
else if (mode == 1)
|
|
printf("%s: %d (%s)\n", domain, psl_is_public_suffix(psl, lower), lower);
|
|
else if (mode == 2)
|
|
printf("%s: %s\n", domain, psl_unregistrable_domain(psl, lower));
|
|
else if (mode == 3)
|
|
printf("%s: %s\n", domain, psl_registrable_domain(psl, lower));
|
|
else if (mode == 4) {
|
|
char *cookie_domain_lower;
|
|
|
|
if ((rc = psl_str_to_utf8lower(domain, NULL, NULL, &cookie_domain_lower)) != 0)
|
|
fprintf(stderr, "%s: Failed to convert cookie domain '%s' to lowercase UTF-8 (%d)\n", domain, cookie_domain, rc);
|
|
else
|
|
printf("%s: %d\n", domain, psl_is_cookie_domain_acceptable(psl, lower, cookie_domain));
|
|
|
|
free(cookie_domain_lower);
|
|
}
|
|
|
|
free(lower);
|
|
}
|
|
|
|
psl_free(psl);
|
|
exit(0);
|
|
}
|
|
}
|
|
|
|
if (mode == 1) {
|
|
for (; arg < argv + argc; arg++)
|
|
printf("%s: %d\n", *arg, psl_is_public_suffix(psl, *arg));
|
|
}
|
|
else if (mode == 2) {
|
|
for (; arg < argv + argc; arg++)
|
|
printf("%s: %s\n", *arg, psl_unregistrable_domain(psl, *arg));
|
|
}
|
|
else if (mode == 3) {
|
|
for (; arg < argv + argc; arg++)
|
|
printf("%s: %s\n", *arg, psl_registrable_domain(psl, *arg));
|
|
}
|
|
else if (mode == 4) {
|
|
for (; arg < argv + argc; arg++)
|
|
printf("%s: %d\n", *arg, psl_is_cookie_domain_acceptable(psl, *arg, cookie_domain));
|
|
}
|
|
else if (mode == 99) {
|
|
if (psl && psl != psl_builtin()) {
|
|
printf("suffixes: %d\n", psl_suffix_count(psl));
|
|
printf("exceptions: %d\n", psl_suffix_exception_count(psl));
|
|
}
|
|
|
|
psl_free(psl);
|
|
psl = (psl_ctx_t *) psl_builtin();
|
|
|
|
if (psl) {
|
|
printf("builtin suffixes: %d\n", psl_suffix_count(psl));
|
|
printf("builtin exceptions: %d\n", psl_suffix_exception_count(psl));
|
|
printf("builtin filename: %s\n", psl_builtin_filename());
|
|
printf("builtin compile time: %ld (%s)\n", psl_builtin_compile_time(), time2str(psl_builtin_compile_time()));
|
|
printf("builtin file time: %ld (%s)\n", psl_builtin_file_time(), time2str(psl_builtin_file_time()));
|
|
printf("builtin SHA1 file hash: %s\n", psl_builtin_sha1sum());
|
|
|
|
#ifdef WITH_LIBICU
|
|
#include <unicode/uloc.h>
|
|
#include <unicode/ucnv.h>
|
|
printf("uloc_getDefault=%s\n", uloc_getDefault());
|
|
printf("ucnv_getDefaultName=%s\n", ucnv_getDefaultName());
|
|
#endif
|
|
} else
|
|
printf("No builtin PSL data available\n");
|
|
}
|
|
|
|
psl_free(psl);
|
|
|
|
return 0;
|
|
}
|