GrafeasGroup · codingJWilliams · May 13, 2018 · May 13, 2018 · May 13, 2018 · May 13, 2018
diff --git a/tor_ocr/main.py b/tor_ocr/main.py
@@ -165,10 +165,27 @@ def decode_image_from_url(url, overlay=False, api_key=__OCR_API_KEY__):
         raise ConnectionError(
             'Attempted all three OCR.space APIs -- cannot connect!'
         )
-
     return result.json()
 
 
+def clean_formatting(body):
+    """Return ``body`` with Reddit markdown and user/sub mentions escaped.
+
+    Nothing is removed: CRLF becomes a blank-line break, and backslashes,
+    markdown control characters and ``u/``/``r/`` mentions each get a
+    leading backslash (the Markdown escape).
+    """
+    # Escape literal backslashes too, in the same single pass; otherwise an
+    # input like ``\*`` would become ``\\*`` and leave the ``*`` active.
+    escapes = str.maketrans({c: '\\' + c for c in '\\>~*_#^+-`|'})
+    body = body.replace('\r\n', '\n\n').translate(escapes)
+    for mention, escaped in (
+        ('/u/', '\\/u/'), ('/r/', '\\/r/'),
+        (' u/', ' \\/u/'), (' r/', ' \\/r/'),
+    ):
+        body = body.replace(mention, escaped)
+    return body
+
 # noinspection PyShadowingNames
 def run(config):
     time.sleep(config.ocr_delay)
@@ -220,19 +237,7 @@ def run(config):
         # should post a top level comment, then keep replying to
         # the comments we make until we run out of chunks.
 
-        chunk = chunk.replace(
-            '\r\n', '\n\n'
-        ).replace(
-            '/u/', '\\/u/'
-        ).replace(
-            '/r/', '\\/r/'
-        ).replace(
-            ' u/', ' \\/u/'
-        ).replace(
-            ' r/', ' \\/r/'
-        ).replace(
-            '>>', '\>\>'
-        )
+        chunk = clean_formatting(chunk)
 
         thing_to_reply_to = thing_to_reply_to.reply(_(chunk))