diff options
author | Joseph Graham <joseph@fibreglass.tunachunks> | 2013-09-07 19:10:32 +0100 |
---|---|---|
committer | Joseph Graham <joseph@fibreglass.tunachunks> | 2013-09-07 19:10:32 +0100 |
commit | c1c6c64ccc59e8fd9d6eed2f42349cc4ede30067 (patch) | |
tree | 81c2f99c49051efa2a927a32754bd00a43145d4e | |
parent | b51e31f9bb102ca5b4ae609a4424a54e7063d794 (diff) |
My attempt at fixing the bot's ability to process UTF-8 in page titles
-rw-r--r-- | common_codez | 5 |
1 files changed, 4 insertions, 1 deletions
diff --git a/common_codez b/common_codez index 5f4b845..33a2f01 100644 --- a/common_codez +++ b/common_codez @@ -2,5 +2,8 @@ function replace_wierd_html_chars { - w3m -dump -T text/html -cols 9999 + #w3m -dump -T text/html -cols 9999 + + # Let's see if this new code works better + recode html..utf-8 } |