summary | refs | log | tree | commit | diff
path: root/sys/src/cmd/htmlfmt/html.c
diff options
context:
space:
mode:
author: cinap_lenrek <cinap_lenrek@felloff.net> 2014-05-12 02:38:53 +0200
committer: cinap_lenrek <cinap_lenrek@felloff.net> 2014-05-12 02:38:53 +0200
commit: 679b092ee02429b444b3e8995f6db11b42008dad (patch)
tree: b5d9321c93474ca4c8c356cac87034386c63f666 /sys/src/cmd/htmlfmt/html.c
parent: 66f76c28212d3a25d4b039de2ce817fc74c5ca1e (diff)
htmlfmt: use uhtml for character set conversion
Diffstat (limited to 'sys/src/cmd/htmlfmt/html.c')
-rw-r--r-- sys/src/cmd/htmlfmt/html.c 31
1 files changed, 2 insertions, 29 deletions
diff --git a/sys/src/cmd/htmlfmt/html.c b/sys/src/cmd/htmlfmt/html.c
index fc3ea4915..5f9ea86be 100644
--- a/sys/src/cmd/htmlfmt/html.c
+++ b/sys/src/cmd/htmlfmt/html.c
@@ -285,40 +285,13 @@ rerender(URLwin *u)
free(t);
}
-/*
- * Somewhat of a hack. Not a full parse, just looks for strings in the beginning
- * of the document (cistrstr only looks at first somewhat bytes).
- */
-int
-charset(char *s)
-{
- char *meta, *emeta, *charset;
-
- if(defcharset == 0)
- defcharset = ISO_8859_1;
- meta = cistrstr(s, "<meta");
- if(meta == nil)
- return defcharset;
- for(emeta=meta; *emeta!='>' && *emeta!='\0'; emeta++)
- ;
- charset = cistrstr(s, "charset=");
- if(charset == nil)
- return defcharset;
- charset += 8;
- if(*charset == '"')
- charset++;
- if(cistrncmp(charset, "utf-8", 5) || cistrncmp(charset, "utf8", 4))
- return UTF_8;
- return defcharset;
-}
-
void
rendertext(URLwin *u, Bytes *b)
{
Rune *rurl;
- rurl = toStr((uchar*)u->url, strlen(u->url), ISO_8859_1);
- u->items = parsehtml(b->b, b->n, rurl, u->type, charset((char*)b->b), &u->docinfo);
+ rurl = toStr((uchar*)u->url, strlen(u->url), UTF_8);
+ u->items = parsehtml(b->b, b->n, rurl, u->type, UTF_8, &u->docinfo);
// free(rurl);
rerender(u);