summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: Admin <admin@marx.cafe> 2022-11-28 01:21:47 -0500
committer: Admin <admin@marx.cafe> 2022-11-28 01:21:47 -0500
commit: 33a6f6db56055d58ee2d24262c4a9abdccdb9679 (patch)
tree: fa90bf68c470efddfd48d2e2b57c98ac38647873
parent: ee1101e85cfa178444324e1826ab60969b52969d (diff)
Replace invalid utf-8 characters in html2md
-rwxr-xr-x  html2md.rb  2
1 file changed, 1 insertion, 1 deletion
diff --git a/html2md.rb b/html2md.rb
index 0ba7f55..404fbde 100755
--- a/html2md.rb
+++ b/html2md.rb
@@ -16,7 +16,7 @@ end
filename = ARGV[0]
file_no_ext = File.basename(filename, File.extname(filename))
-content = File.read(filename)
+content = File.read(filename).encode('UTF-8', invalid: :replace, undef: :replace)
doc = Nokogiri.parse(content)
title = doc.title