#!/usr/bin/env python
"""Print every run of high bytes (0x80-0xFF) found on standard input.

Each maximal run of consecutive bytes in the range 0x80-0xFF is written to
standard output on its own line, in the order the runs occur in the input.
"""

import re
import sys

# One or more consecutive bytes with the high bit set.  A bytes pattern is
# used so that matching operates on raw bytes rather than decoded text.
r_hibytes = re.compile(br'[\x80-\xff]+')


def find_hibytes(data):
    """Return all maximal runs of bytes 0x80-0xFF in *data*, in order.

    *data* must be a bytes-like object; the result is a list of byte
    strings, empty when *data* contains no high bytes.
    """
    return r_hibytes.findall(data)


def main():
    """Read all of stdin and write each high-byte run followed by a newline."""
    # Where the text streams expose an underlying binary ``buffer``, use it so
    # the data is never decoded/encoded; otherwise the streams are used
    # directly.
    stdin = getattr(sys.stdin, "buffer", sys.stdin)
    stdout = getattr(sys.stdout, "buffer", sys.stdout)

    data = stdin.read()
    for run in find_hibytes(data):
        stdout.write(run + b"\n")


if __name__ == "__main__":
    main()