#!/usr/bin/env python import rclexecm import rclexec1 import re import sys import os # Processing the output from unrtf class RTFProcessData: def __init__(self, em): self.em = em self.out = "" self.gothead = 0 self.patendhead = re.compile('''''') self.patcharset = re.compile('''^' + "\n" self.out += line + "\n" self.gothead = 1 elif not self.patcharset.search(line): self.out += line + "\n" else: self.out += line + "\n" def wrapData(self): return self.out class RTFFilter: def __init__(self, em): self.em = em def reset(self): pass def getCmd(self, fn): cmd = rclexecm.which("unrtf") if cmd: return ([cmd, "--nopict", "--html"], RTFProcessData(self.em)) else: return ([],None) if __name__ == '__main__': if not rclexecm.which("unrtf"): print("RECFILTERROR HELPERNOTFOUND antiword") sys.exit(1) proto = rclexecm.RclExecM() filter = RTFFilter(proto) extract = rclexec1.Executor(proto, filter) rclexecm.main(proto, extract)