/* * This file is part of NetSurf, http://netsurf.sourceforge.net/ * Licensed under the GNU General Public License, * http://www.opensource.org/licenses/gpl-license * Copyright 2003 James Bursa * Copyright 2003 Phil Mellor * Copyright 2003 John M Bell */ #include #include #include #include #include #include #include #include #include #include "libxml/encoding.h" #include "libxml/uri.h" #include "netsurf/utils/config.h" #ifdef riscos #include "netsurf/riscos/about.h" #include "netsurf/riscos/constdata.h" #endif #include "netsurf/utils/log.h" #include "netsurf/utils/messages.h" #include "netsurf/utils/utils.h" void die(const char * const error) { fprintf(stderr, "Fatal: %s\n", error); exit(EXIT_FAILURE); } char * strip(char * const s) { size_t i; for (i = strlen(s); i != 0 && isspace(s[i-1]); i--) ; s[i] = 0; return s + strspn(s, " \t\r\n"); } int whitespace(const char * str) { unsigned int i; for (i = 0; i < strlen(str); i++) if (!isspace(str[i])) return 0; return 1; } void * xcalloc(const size_t n, const size_t size) { void * p = calloc(n, size); if (p == 0) die("Out of memory in xcalloc()"); return p; } void * xrealloc(void * p, const size_t size) { p = realloc(p, size); if (p == 0) die("Out of memory in xrealloc()"); return p; } void xfree(void* p) { if (p == 0) fprintf(stderr, "Attempt to free NULL pointer\n"); else free(p); } char * xstrdup(const char * const s) { char * c = malloc(strlen(s) + 1); if (c == 0) die("Out of memory in xstrdup()"); strcpy(c, s); return c; } char * load(const char * const path) { FILE * fp = fopen(path, "rb"); char * buf; long size, read; if (fp == 0) die("Failed to open file"); if (fseek(fp, 0, SEEK_END) != 0) die("fseek() failed"); if ((size = ftell(fp)) == -1) die("ftell() failed"); buf = xcalloc((size_t) size, 1); if (fseek(fp, 0, SEEK_SET) != 0) die("fseek() failed"); read = fread(buf, 1, (size_t) size, fp); if (read < size) die("fread() failed"); return buf; } char * squash_whitespace(const char * s) { char * c = malloc(strlen(s) + 1); int i = 0, j = 0; if (c == 0) die("Out of memory in squash_whitespace()"); do { if (isspace(s[i])) { c[j++] = ' '; while (s[i] != 0 && isspace(s[i])) i++; } c[j++] = s[i++]; } while (s[i - 1] != 0); return c; } char * tolat1(xmlChar * s) { unsigned int length = strlen((char*) s); unsigned int space = length + 100; char *d = xcalloc(space, sizeof(char)); char *d0 = d; char *end = d0 + space - 10; int u, chars; while (*s != 0) { chars = length; u = xmlGetUTF8Char((unsigned char *) s, &chars); if (chars <= 0) { s += 1; length -= 1; LOG(("UTF-8 error")); continue; } s += chars; length -= chars; if (u == 0x09 || u == 0x0a || u == 0x0d) *d++ = ' '; else if ((0x20 <= u && u <= 0x7f) || (0xa0 <= u && u <= 0xff)) *d++ = u; else { unicode_transliterate((unsigned int) u, &d); if (end < d) { space += 100; d0 = xrealloc(d0, space); end = d0 + space - 10; } } } *d = 0; return d0; } char * tolat1_pre(xmlChar * s) { unsigned int length = strlen((char*) s); char *d = xcalloc(length + 1, sizeof(char)); char *d0 = d; int u, chars; while (*s != 0) { chars = length; u = xmlGetUTF8Char((unsigned char *) s, &chars); s += chars; length -= chars; if (u == 0x09 || u == 0x0a || u == 0x0d || (0x20 <= u && u <= 0x7f) || (0xa0 <= u && u <= 0xff)) *d = u; else *d = '?'; d++; } *d = 0; return d0; } char *squash_tolat1(xmlChar *s) { /* TODO: optimize */ char *lat1 = tolat1(s); char *squash = squash_whitespace(lat1); free(lat1); return squash; } /** * Calculate a URL from a relative and base URL. * * base may be 0 for a new URL, in which case the URL is canonicalized and * returned. Returns 0 in case of error. */ char *url_join(char *rel_url, char *base_url) { char *res; uri_t *base = 0, *rel = 0, *abs; LOG(("rel_url = %s, base_url = %s", rel_url, base_url)); #ifdef riscos /* hacky, hacky, hacky... * It is, however, best to do this here as it avoids * duplicating code for clicking links and url bar handling. * It simplifies the code it the other places too (they just * call this as usual, then we handle it here). */ #ifdef WITH_ABOUT if (strcasecmp(rel_url, "about:") == 0) { about_create(); return xstrdup(ABOUT_URL); } #ifdef WITH_COOKIES else if (strcasecmp(rel_url, "about:cookies") == 0) { cookie_create(); return xstrdup(COOKIE_URL); } #endif else #endif if (strcasecmp(rel_url, "help:") == 0) { return xstrdup(HELP_URL); } else if (strcasecmp(rel_url, "home:") == 0) { return xstrdup(HOME_URL); } #endif if (!base_url) { res = uri_cannonicalize_string(rel_url, (int)(strlen(rel_url)), URI_STRING_URI_STYLE); LOG(("res = %s", res)); if (res) return xstrdup(res); return 0; } base = uri_alloc(base_url, (int)(strlen(base_url))); rel = uri_alloc(rel_url, (int)(strlen(rel_url))); if (!base || !rel) goto fail; if (!base->scheme) goto fail; abs = uri_abs_1(base, rel); res = xstrdup(uri_uri(abs)); uri_free(base); uri_free(rel); LOG(("res = %s", res)); return res; fail: if (base) uri_free(base); if (rel) uri_free(rel); LOG(("error")); return 0; } /** * Extract the host name from a url. * * \param url an absolute URL * \return a new string, or 0 in case of error */ char *get_host_from_url(char *url) { char *host = 0; uri_t *uri; uri = uri_alloc(url, (int)(strlen(url))); if (!uri) return 0; if (uri->host) host = xstrdup(uri->host); uri_free(uri); return host; } /** * Check if a directory exists. */ bool is_dir(const char *path) { struct stat s; if (stat(path, &s)) return false; return S_ISDIR(s.st_mode) ? true : false; } /** * Compile a regular expression, handling errors. * * Parameters as for regcomp(), see man regex. */ void regcomp_wrapper(regex_t *preg, const char *regex, int cflags) { char errbuf[200]; int r; r = regcomp(preg, regex, cflags); if (r) { regerror(r, preg, errbuf, sizeof errbuf); fprintf(stderr, "Failed to compile regexp '%s'\n", regex); die(errbuf); } } /** * Remove expired cookies from the cookie jar. * libcurl /really/ should do this for us. * This gets called every time a window is closed or NetSurf is quit. */ #ifdef WITH_COOKIES void clean_cookiejar(void) { FILE *fp; int len; char *cookies = 0, *pos; char domain[256], flag[10], path[256], secure[10], exp[50], name[256], val[256]; long int expiry; fp = fopen(messages_get("cookiefile"), "r"); if (!fp) { LOG(("Failed to open cookie jar")); return; } /* read file length */ fseek(fp, 0, SEEK_END); len = ftell(fp); fseek(fp, 0, SEEK_SET); cookies = xcalloc((unsigned int)len, sizeof(char)); fread(cookies, (unsigned int)len, sizeof(char), fp); fclose(fp); if (remove(messages_get("cookiejar"))) { LOG(("Failed to remove old jar")); xfree(cookies); return; } fp = fopen(messages_get("cookiejar"), "w+"); if (!fp) { xfree(cookies); LOG(("Failed to create new jar")); return; } /* write header */ fputs("# Netscape HTTP Cookie File\n" "# http://www.netscape.com/newsref/std/cookie_spec.html\n" "# This file was generated by libcurl! Edit at your own risk.\n\n", fp); pos = cookies; while (pos != (cookies+len-1)) { if (*pos == '#') { for (; *pos != '\n'; pos++); pos += 1; continue; } sscanf(pos, "%s\t%s\t%s\t%s\t%s\t%s\t%s\n", domain, flag, path, secure, exp, name, val); pos += (strlen(domain) + strlen(flag) + strlen(path) + strlen(secure) + strlen(exp) + strlen(name) + strlen(val) + 7); sscanf(exp, "%ld", &expiry); if (time(NULL) < expiry) { /* cookie hasn't expired */ fprintf(fp, "%s\t%s\t%s\t%s\t%s\t%s\t%s\n", domain, flag, path, secure, exp, name, val); } } fclose(fp); xfree(cookies); } #endif