[IMP] document: support indexing of .docx to text and .pptx to HTML

bzr revid: ysa@tinyerp.co.in-20100311085600-4t4gmuzywglpugh0
2010-03-11 14:26:00 +05:30 · 2010-03-11 14:26:00 +05:30 · d217272611
parent e7fb07589f
commit d217272611
1 changed files with 16 additions and 3 deletions
--- a/addons/document/std_index.py
+++ b/addons/document/std_index.py
@ -21,7 +21,7 @@

 import StringIO
 import odt2txt
-
+from subprocess import Popen, PIPE
 from content_index import indexer, cntIndex


@ -50,15 +50,28 @@ class TxtIndex(indexer):
        
 cntIndex.register(TxtIndex())

+class PptIndex(indexer):
+    """Index PowerPoint presentations through the external ``ppthtml`` tool.
+
+    The file is handed to ``ppthtml`` and whatever the tool writes to its
+    standard output is returned, converted with ``_to_unicode``.
+    """
+
+    def _getMimeTypes(self):
+        # PowerPoint has its own MIME type.  Returning 'application/ms-word'
+        # here would make this indexer and DocIndex claim the same type.
+        return ['application/vnd.ms-powerpoint']
+
+    def _getExtensions(self):
+        # NOTE(review): ppthtml presumably reads only the binary .ppt format;
+        # confirm that .pptx input really yields indexable output.
+        return ['.ppt', '.pptx']
+
+    def _doIndexFile(self, fname):
+        """Run ``ppthtml`` on *fname* and return its stdout as unicode."""
+        proc = Popen(['ppthtml', fname], shell=False, stdout=PIPE)
+        # communicate() reads stdout to EOF, closes the pipe and waits for
+        # the child, so no process or descriptor is left behind.
+        output = proc.communicate()[0]
+        return _to_unicode(output)
+
+cntIndex.register(PptIndex())
+
 class DocIndex(indexer):
+    # Indexer for Word documents: runs the external `antiword` program on
+    # the file and returns whatever it writes to standard output.
    def _getMimeTypes(self):
        return [ 'application/ms-word']
    
    def _getExtensions(self):
-        return ['.doc']
+        # NOTE(review): antiword presumably reads only the binary .doc format;
+        # confirm that .docx input actually produces text.
+        return ['.doc','.docx']

    def _doIndexFile(self,fname):
-        fp = Popen(['antiword',fname], shell=False, stdout=PIPE).stdout
+        # Only the stdout pipe is kept; the Popen object itself is dropped,
+        # so the child process is never explicitly waited on here.
+        fp = Popen(['antiword', fname], shell=False, stdout=PIPE).stdout
        return _to_unicode( fp.read())

 cntIndex.register(DocIndex())