Subversion Repositories planix.SVN

Rev

Rev 2 | Blame | Compare with Previous | Last modification | View Log | RSS feed

#include <u.h>
#include <libc.h>
#include <bio.h>
#include <ndb.h>
#include "whois.h"

typedef struct Country Country;

struct Country
{
        char *code;
        char *name;
};

Country badc[] =
{
        {"af", "afghanistan"},
        {"cu", "cuba"},
        {"ir", "iran"},
        {"iq", "iraq"},
        {"ly", "libya"},
        {"kp", "north korea"},
        {"sd", "sudan"},
        {"sy", "syria"},
        { 0, 0 }
};

Country goodc[] =
{
        // the original, us and canada
        {"us", "united states of america"},
        {"ca", "canada"},
        {"gov", "gov"},
        {"mil", "mil"},

        // the european union
        { "eu", "european union" },
        { "be", "belgium" },
        { "de", "germany" },
        { "fr", "france" },
        { "it", "italy" },
        { "lu", "luxembourg" },
        { "nl", "netherlands" },
        { "dk", "denmark" },
        { "ie", "ireland" },
        { "gb", "great britain" },
        { "uk", "united kingdom" },
        { "gr", "greece" },
        { "es", "spain" },
        { "pt", "portugal" },
        { "au", "australia" },
        { "fi", "finland" },
        { "se", "sweden" },

        // the rest
        {"au", "australia"},
        {"no", "norway"},
        {"cz", "czech republic"},
        {"hu", "hungary"},
        {"pl", "poland"},
        {"jp", "japan"},
        {"ch", "switzerland"},
        {"nz", "new zealand"},
        { 0, 0 }
};

char *gov[] =
{
        "gov",
        "gouv",
        "mil",
        "government",
        0,
};

Country allc[] =
{
        { "ad", "andorra" },
        { "ae", "united arab emirates" },
        { "af", "afghanistan" },
        { "ag", "antigua and barbuda" },
        { "ai", "anguilla" },
        { "al", "albania" },
        { "am", "armenia" },
        { "an", "netherlands antilles" },
        { "ao", "angola" },
        { "aq", "antarctica" },
        { "ar", "argentina" },
        { "as", "american samoa" },
        { "at", "austria" },
        { "au", "australia" },
        { "aw", "aruba" },
        { "az", "azerbaijan" },
        { "ba", "bosnia and herzegovina" },
        { "bb", "barbados" },
        { "bd", "bangladesh" },
        { "be", "belgium" },
        { "bf", "burkina faso" },
        { "bg", "bulgaria" },
        { "bh", "bahrain" },
        { "bi", "burundi" },
        { "bj", "benin" },
        { "bm", "bermuda" },
        { "bn", "brunei darussalam" },
        { "bo", "bolivia" },
        { "br", "brazil" },
        { "bs", "bahamas" },
        { "bt", "bhutan" },
        { "bu", "burma" },
        { "bv", "bouvet island" },
        { "bw", "botswana" },
        { "by", "belarus" },
        { "bz", "belize" },
        { "ca", "canada" },
        { "cc", "cocos (keeling) islands" },
        { "cf", "central african republic" },
        { "cg", "congo" },
        { "ch", "switzerland" },
        { "ci", "cote d'ivoire (ivory coast)" },
        { "ck", "cook islands" },
        { "cl", "chile" },
        { "cm", "cameroon" },
        { "cn", "china" },
        { "co", "colombia" },
        { "cr", "costa rica" },
        { "cs", "czechoslovakia (former)" },
        { "ct", "canton and enderbury island" },
        { "cu", "cuba" },
        { "cv", "cape verde" },
        { "cx", "christmas island" },
        { "cy", "cyprus" },
        { "cz", "czech republic" },
        { "dd", "german democratic republic" },
        { "de", "germany" },
        { "dj", "djibouti" },
        { "dk", "denmark" },
        { "dm", "dominica" },
        { "do", "dominican republic" },
        { "dz", "algeria" },
        { "ec", "ecuador" },
        { "ee", "estonia" },
        { "eg", "egypt" },
        { "eh", "western sahara" },
        { "er", "eritrea" },
        { "es", "spain" },
        { "et", "ethiopia" },
        { "eu", "european union" },
        { "fi", "finland" },
        { "fj", "fiji" },
        { "fk", "falkland islands (malvinas)" },
        { "fm", "micronesia" },
        { "fo", "faroe islands" },
        { "fr", "france" },
        { "fx", "france, metropolitan" },
        { "ga", "gabon" },
        { "gb", "great britain (uk)" },
        { "gd", "grenada" },
        { "ge", "georgia" },
        { "gf", "french guiana" },
        { "gh", "ghana" },
        { "gi", "gibraltar" },
        { "gl", "greenland" },
        { "gm", "gambia" },
        { "gn", "guinea" },
        { "gp", "guadeloupe" },
        { "gq", "equatorial guinea" },
        { "gr", "greece" },
        { "gs", "s. georgia and s. sandwich isls." },
        { "gt", "guatemala" },
        { "gu", "guam" },
        { "gw", "guinea-bissau" },
        { "gy", "guyana" },
        { "hk", "hong kong" },
        { "hm", "heard and mcdonald islands" },
        { "hn", "honduras" },
        { "hr", "croatia (hrvatska)" },
        { "ht", "haiti" },
        { "hu", "hungary" },
        { "id", "indonesia" },
        { "ie", "ireland" },
        { "il", "israel" },
        { "in", "india" },
        { "io", "british indian ocean territory" },
        { "iq", "iraq" },
        { "ir", "iran" },
        { "is", "iceland" },
        { "it", "italy" },
        { "jm", "jamaica" },
        { "jo", "jordan" },
        { "jp", "japan" },
        { "jt", "johnston island" },
        { "ke", "kenya" },
        { "kg", "kyrgyzstan" },
        { "kh", "cambodia (democratic kampuchea)" },
        { "ki", "kiribati" },
        { "km", "comoros" },
        { "kn", "saint kitts and nevis" },
        { "kp", "korea (north)" },
        { "kr", "korea (south)" },
        { "kw", "kuwait" },
        { "ky", "cayman islands" },
        { "kz", "kazakhstan" },
        { "la", "laos" },
        { "lb", "lebanon" },
        { "lc", "saint lucia" },
        { "li", "liechtenstein" },
        { "lk", "sri lanka" },
        { "lr", "liberia" },
        { "ls", "lesotho" },
        { "lt", "lithuania" },
        { "lu", "luxembourg" },
        { "lv", "latvia" },
        { "ly", "libya" },
        { "ma", "morocco" },
        { "mc", "monaco" },
        { "md", "moldova" },
        { "mg", "madagascar" },
        { "mh", "marshall islands" },
        { "mi", "midway islands" },
        { "mk", "macedonia" },
        { "ml", "mali" },
        { "mm", "myanmar" },
        { "mn", "mongolia" },
        { "mo", "macau" },
        { "mp", "northern mariana islands" },
        { "mq", "martinique" },
        { "mr", "mauritania" },
        { "ms", "montserrat" },
        { "mt", "malta" },
        { "mu", "mauritius" },
        { "mv", "maldives" },
        { "mw", "malawi" },
        { "mx", "mexico" },
        { "my", "malaysia" },
        { "mz", "mozambique" },
        { "na", "namibia" },
        { "nc", "new caledonia" },
        { "ne", "niger" },
        { "nf", "norfolk island" },
        { "ng", "nigeria" },
        { "ni", "nicaragua" },
        { "nl", "netherlands" },
        { "no", "norway" },
        { "np", "nepal" },
        { "nq", "dronning maud land" },
        { "nr", "nauru" },
        { "nt", "neutral zone" },
        { "nu", "niue" },
        { "nz", "new zealand (aotearoa)" },
        { "om", "oman" },
        { "pa", "panama" },
        { "pc", "pacific islands" },
        { "pe", "peru" },
        { "pf", "french polynesia" },
        { "pg", "papua new guinea" },
        { "ph", "philippines" },
        { "pk", "pakistan" },
        { "pl", "poland" },
        { "pm", "st. pierre and miquelon" },
        { "pn", "pitcairn" },
        { "pr", "puerto rico" },
        { "pu", "united states misc. pacific islands" },
        { "pt", "portugal" },
        { "pw", "palau" },
        { "py", "paraguay" },
        { "qa", "qatar" },
        { "re", "reunion" },
        { "ro", "romania" },
        { "ru", "russian federation" },
        { "rw", "rwanda" },
        { "sa", "saudi arabia" },
        { "sb", "solomon islands" },
        { "sc", "seychelles" },
        { "sd", "sudan" },
        { "se", "sweden" },
        { "sg", "singapore" },
        { "sh", "st. helena" },
        { "si", "slovenia" },
        { "sj", "svalbard and jan mayen islands" },
        { "sk", "slovak republic" },
        { "sl", "sierra leone" },
        { "sm", "san marino" },
        { "sn", "senegal" },
        { "so", "somalia" },
        { "sr", "suriname" },
        { "st", "sao tome and principe" },
        { "su", "ussr (former)" },
        { "sv", "el salvador" },
        { "sy", "syria" },
        { "sz", "swaziland" },
        { "tc", "turks and caicos islands" },
        { "td", "chad" },
        { "tf", "french southern territories" },
        { "tg", "togo" },
        { "th", "thailand" },
        { "tj", "tajikistan" },
        { "tk", "tokelau" },
        { "tm", "turkmenistan" },
        { "tn", "tunisia" },
        { "to", "tonga" },
        { "tp", "east timor" },
        { "tr", "turkey" },
        { "tt", "trinidad and tobago" },
        { "tv", "tuvalu" },
        { "tw", "taiwan" },
        { "tz", "tanzania" },
        { "ua", "ukraine" },
        { "ug", "uganda" },
        { "uk", "united kingdom" },
        { "um", "us minor outlying islands" },
        { "us", "united states" },
        { "uy", "uruguay" },
        { "uz", "uzbekistan" },
        { "va", "vatican city state (holy see)" },
        { "vc", "saint vincent and the grenadines" },
        { "ve", "venezuela" },
        { "vg", "virgin islands (british)" },
        { "vi", "virgin islands (u.s.)" },
        { "vn", "viet nam" },
        { "vu", "vanuatu" },
        { "wf", "wallis and futuna islands" },
        { "wk", "wake island" },
        { "ws", "samoa" },
        { "yd", "democratic yemen" },
        { "ye", "yemen" },
        { "yt", "mayotte" },
        { "yu", "yugoslavia" },
        { "za", "south africa" },
        { "zm", "zambia" },
        { "zr", "zaire" },
        { "zw", "zimbabwe" },

        {"gov", "gov"},
        {"mil", "mil"},

        { 0, 0 }
};

int classdebug;

static int
incountries(char *s, Country *cp)
{
        for(; cp->code != 0; cp++)
                if(cistrcmp(s, cp->code) == 0
                || cistrcmp(s, cp->name) == 0)
                        return 1;
        return 0;
}

static int
indomains(char *s, char **dp)
{
        for(; *dp != nil; dp++)
                if(cistrcmp(s, *dp) == 0)
                        return 1;

        return 0;
}

int
classify(char *ip, Ndbtuple *t)
{
        int isgov, iscountry, isbadc, isgoodc;
        char dom[256];
        char *df[128];
        Ndbtuple *nt, *x;
        int n;

        isgov = iscountry = isbadc = 0;
        isgoodc = 1;
        
        for(nt = t; nt != nil; nt = nt->entry){
                if(strcmp(nt->attr, "country") == 0){
                        iscountry = 1;
                        if(incountries(nt->val, badc)){
                                if(classdebug)fprint(2, "isbadc\n");
                                isbadc = 1;
                                isgoodc = 0;
                        } else if(!incountries(nt->val, goodc)){
                                if(classdebug)fprint(2, "!isgoodc\n");
                                isgoodc = 0;
                        }
                }

                /* domain names can always hurt, even without forward verification */
                if(strcmp(nt->attr, "dom") == 0){
                        strncpy(dom, nt->val, sizeof dom);
                        dom[sizeof(dom)-1] = 0;
                        n = getfields(dom, df, nelem(df), 0, ".");

                        /* a bad country in a domain name is always believed */
                        if(incountries(df[n-1], badc)){
                                if(classdebug)fprint(2, "isbadc dom\n");
                                isbadc = 1;
                                isgoodc = 0;
                        }

                        /* a goverment in a domain name is always believed */
                        if(n > 1 && indomains(df[n-2], gov))
                                isgov = 1;
                }
        }
        if(iscountry == 0){
                /* did the forward lookup work? */
                for(nt = t; nt != nil; nt = nt->entry){
                        if(strcmp(nt->attr, "ip") == 0 && strcmp(nt->val, ip) == 0)
                                break;
                }

                /* see if the domain name ends in a country code */
                if(nt != nil && (x = ndbfindattr(t, nt, "dom")) != nil){
                        strncpy(dom, x->val, sizeof dom);
                        dom[sizeof(dom)-1] = 0;
                        n = getfields(dom, df, nelem(df), 0, ".");
                        if(incountries(df[n-1], allc))
                                iscountry = 1;
                }
        }
        if(iscountry == 0)
                return Cunknown;
        if(isbadc)
                return Cbadc;
        if(!isgoodc && isgov)
                return Cbadgov;
        return Cok;
}