diff --git a/source/de/anomic/htmlFilter/htmlFilterContentScraper.java b/source/de/anomic/htmlFilter/htmlFilterContentScraper.java
index fa0d0d14e..94ed64288 100644
--- a/source/de/anomic/htmlFilter/htmlFilterContentScraper.java
+++ b/source/de/anomic/htmlFilter/htmlFilterContentScraper.java
@@ -485,10 +485,14 @@ public class htmlFilterContentScraper extends htmlFilterAbstractScraper implemen
         final byte[] page = serverFileUtils.read(file);
         if (page == null) throw new IOException("no content in file " + file.toString());
         
+        // scrape document to look up charset
+        final htmlFilterInputStream htmlFilter = new htmlFilterInputStream(new ByteArrayInputStream(page),"UTF-8",new yacyURL("http://localhost", null),null,false);
+        final String charset = htmlFilter.detectCharset();
+        
         // scrape content
         final htmlFilterContentScraper scraper = new htmlFilterContentScraper(new yacyURL("http://localhost", null));
         final Writer writer = new htmlFilterWriter(null, null, scraper, null, false);
-        serverFileUtils.copy(new ByteArrayInputStream(page), writer, Charset.forName("UTF-8"));
+        serverFileUtils.copy(new ByteArrayInputStream(page), writer, Charset.forName(charset));
         
         return scraper;
     }