summary refs log tree commit diff
path: root/tests/tld-test.c
blob: 7be0ae7155b2ff45b4bf0f31edd7743346a6c460 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
/* -*- Mode: C; tab-width: 8; indent-tabs-mode: t; c-basic-offset: 8 -*- */
/*
 * Copyright (C) 2012 Igalia S.L.
 */

#include <glib.h>
#include <libsoup/soup.h>
#include <string.h>

#include "test-utils.h"

/*
 * Test vectors, taken from http://publicsuffix.org/list/test.txt with a few
 * local additions at the end.
 *
 * hostname: the host name handed to the soup_tld_* functions by main().
 * result:   the base domain expected for that host name, or NULL when no base
 *           domain is expected (the host name is itself a public suffix, or
 *           it is invalid, e.g. it starts with a dot).
 *
 * The table is only ever read, hence const.
 */
static const struct {
  const char *hostname;
  const char *result;
} tld_tests[] = {
  /* NULL input. Not checked here because the API requires a valid hostname. */
  /* { NULL, NULL }, */
  /* Mixed case. Not checked because the API requires a valid hostname. */
  /* { "COM", NULL }, */
  /* { "example.COM", "example.com" }, */
  /* { "WwW.example.COM", "example.com" }, */
  /* Leading dot. */
  { ".com", NULL },
  { ".example", NULL },
  { ".example.com", NULL },
  { ".example.example", NULL },
  /* Unlisted TLD. Not checked because we do not want to force every URL to have a public suffix. */
  /* { "example", NULL }, */
  /* { "example.example", NULL }, */
  /* { "b.example.example", NULL }, */
  /* { "a.b.example.example", NULL }, */
  /* Listed, but non-Internet, TLD. */
  /* { "local", NULL }, */
  /* { "example.local", NULL }, */
  /* { "b.example.local", NULL }, */
  /* { "a.b.example.local", NULL }, */
  /* TLD with only 1 rule. */
  { "biz", NULL },
  { "domain.biz", "domain.biz" },
  { "b.domain.biz", "domain.biz" },
  { "a.b.domain.biz", "domain.biz" },
  /* TLD with some 2-level rules. */
  { "com", NULL },
  { "example.com", "example.com" },
  { "b.example.com", "example.com" },
  { "a.b.example.com", "example.com" },
  { "uk.com", NULL },
  { "example.uk.com", "example.uk.com" },
  { "b.example.uk.com", "example.uk.com" },
  { "a.b.example.uk.com", "example.uk.com" },
  { "test.ac", "test.ac" },
  /* TLD with only 1 (wildcard) rule. */
  { "cy", NULL },
  { "c.cy", NULL },
  { "b.c.cy", "b.c.cy" },
  { "a.b.c.cy", "b.c.cy" },
  /* More complex TLD. */
  { "jp", NULL },
  { "test.jp", "test.jp" },
  { "www.test.jp", "test.jp" },
  { "ac.jp", NULL },
  { "test.ac.jp", "test.ac.jp" },
  { "www.test.ac.jp", "test.ac.jp" },
  { "kyoto.jp", NULL },
  { "c.kyoto.jp", NULL },
  { "b.c.kyoto.jp", "b.c.kyoto.jp" },
  { "a.b.c.kyoto.jp", "b.c.kyoto.jp" },
  { "pref.kyoto.jp", "pref.kyoto.jp" },	/* Exception rule. */
  { "www.pref.kyoto.jp", "pref.kyoto.jp" },	/* Exception rule. */
  { "city.kyoto.jp", "city.kyoto.jp" },	/* Exception rule. */
  { "www.city.kyoto.jp", "city.kyoto.jp" },	/* Exception rule. */
  /* TLD with a wildcard rule and exceptions. */
  { "om", NULL },
  { "test.om", NULL },
  { "b.test.om", "b.test.om" },
  { "a.b.test.om", "b.test.om" },
  { "songfest.om", "songfest.om" },
  { "www.songfest.om", "songfest.om" },
  /* US K12. */
  { "us", NULL },
  { "test.us", "test.us" },
  { "www.test.us", "test.us" },
  { "ak.us", NULL },
  { "test.ak.us", "test.ak.us" },
  { "www.test.ak.us", "test.ak.us" },
  { "k12.ak.us", NULL },
  { "test.k12.ak.us", "test.k12.ak.us" },
  { "www.test.k12.ak.us", "test.k12.ak.us" },
  /* This is not in http://publicsuffix.org/list/test.txt but we want to check it anyway. */
  { "co.uk", NULL },
  /* The original list does not include non-ASCII tests. Let's add a couple. */
  { "公司.cn", NULL },
  { "a.b.åfjord.no", "b.åfjord.no" }
};

/*
 * Feeds every entry of tld_tests to soup_tld_domain_is_public_suffix() and
 * soup_tld_get_base_domain(), and bumps the `errors` counter (declared outside
 * this file, presumably by test-utils.h) for each mismatch.
 *
 * Returns 0 when no mismatch was recorded, 1 otherwise.
 */
int
main (int argc, char **argv)
{
	/* G_N_ELEMENTS is a sizeof quotient, so index with an unsigned type. */
	size_t i;

	test_init (argc, argv, NULL);

	errors = 0;
	for (i = 0; i < G_N_ELEMENTS (tld_tests); ++i) {
		const char *hostname = tld_tests[i].hostname;
		const char *expected = tld_tests[i].result;
		gboolean is_public = soup_tld_domain_is_public_suffix (hostname);
		/* NULL as last argument: failure details are not collected,
		 * only the (possibly NULL) return value is inspected.
		 */
		const char *base_domain = soup_tld_get_base_domain (hostname, NULL);

		if (expected) {
			/* A base domain is expected: the hostname must not be
			 * reported as a public suffix and the result must match.
			 */
			if (is_public || g_strcmp0 (expected, base_domain)) {
				/* base_domain may be NULL on this path; never
				 * hand a NULL pointer to a %s conversion.
				 */
				debug_printf (1, "ERROR: %s got %s (%s expected)\n",
					      hostname,
					      base_domain ? base_domain : "(null)",
					      expected);
				++errors;
			}
		} else {
			/* If there is no expected result then either the domain is public or
			 * the hostname invalid (for example starts with a leading dot).
			 */
			if (!is_public && base_domain) {
				debug_printf (1, "ERROR: public domain %s got %s (none expected)\n",
					      hostname, base_domain);
				++errors;
			}
		}
	}

	test_cleanup ();

	return errors != 0;
}