#scraper/replacements/encoding.txt
# --- fix common encoding artifacts ---
# Each rule is written as <match>=<replacement>; an empty right-hand side
# removes the match. Rules are kept one per line and comments sit on their
# own lines, so no rule depends on the loader stripping trailing "# ..." text.

# IDEOGRAPHIC SPACE → empty
\u3000=
# non-breaking space → empty
\u00A0=

# full-width punctuation → ASCII
# The left-hand side must be the full-width character (U+FF0C, U+FF01, ...);
# an ASCII key such as ",=," is an identity rule that never changes anything.
,=,
。=.
!=!
?=?
;=;
:=:
(=(
)=)
【=[
】=]
《=<
》=>

# hyphen variants → ASCII hyphen-minus
# (a later "—=—" identity rule contradicted "—=-" and has been dropped)
–=-
—=-
―=-

# typographic quotes → ASCII quotes
“="
”="
’='

# NOTE(review): identity rule, has no effect as written; presumably meant
# "…=..." — confirm before changing.
…=…

# bullets and block/marker glyphs
•=*
▁=
▲=

# NOTE(review): the previous version of this list ended with four rules whose
# keys were whitespace-only or empty as stored (" =", " =", "=", " ="), plus
# second copies of "\u3000=" and "\u00A0=". The intended characters cannot be
# told apart in that form, and a literal space key would strip every space.
# Re-add each one as a \uXXXX escape (as done for \u3000 and \u00A0 above)
# once the intended code point is confirmed.