From c79bd8e49c8035ec657bd2b6f98507e0f9164ca7 Mon Sep 17 00:00:00 2001 From: Eric van der Vlist Date: Sat, 28 Apr 2012 09:42:21 +0200 Subject: [PATCH] Forcing HTML content type for XHTML documents --- archiver/pipelines/actions/mediatypes/warc-html.xpl | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/archiver/pipelines/actions/mediatypes/warc-html.xpl b/archiver/pipelines/actions/mediatypes/warc-html.xpl index 7d30e57..f7411d1 100644 --- a/archiver/pipelines/actions/mediatypes/warc-html.xpl +++ b/archiver/pipelines/actions/mediatypes/warc-html.xpl @@ -11,6 +11,8 @@ session + utf-8 + true @@ -24,6 +26,10 @@ + utf-8 + true + text/html + true html