diff --git a/archiver/pipelines/actions/mediatypes/warc-html.xpl b/archiver/pipelines/actions/mediatypes/warc-html.xpl index 7d30e57..f7411d1 100644 --- a/archiver/pipelines/actions/mediatypes/warc-html.xpl +++ b/archiver/pipelines/actions/mediatypes/warc-html.xpl @@ -11,6 +11,8 @@ session + utf-8 + true @@ -24,6 +26,10 @@ + utf-8 + true + text/html + true html