[Erp5-report] r9078 - /erp5/trunk/utils/ooodoc_server/worker.py

nobody at svn.erp5.org nobody at svn.erp5.org
Mon Aug 7 18:42:36 CEST 2006


Author: bartek
Date: Mon Aug  7 18:42:28 2006
New Revision: 9078

URL: http://svn.erp5.org?rev=9078&view=rev
Log:
Fixed text extraction from HTML.

Modified:
    erp5/trunk/utils/ooodoc_server/worker.py

Modified: erp5/trunk/utils/ooodoc_server/worker.py
URL: http://svn.erp5.org/erp5/trunk/utils/ooodoc_server/worker.py?rev=9078&r1=9077&r2=9078&view=diff
==============================================================================
--- erp5/trunk/utils/ooodoc_server/worker.py (original)
+++ erp5/trunk/utils/ooodoc_server/worker.py Mon Aug  7 18:42:28 2006
@@ -28,7 +28,6 @@
 ##############################################################################
 
 import os,sys,pdb,time, formatter, htmllib
-sys.path.append('/etc/ooodoc')
 import config
 sys.path.append(config.unopath)
 import uno
@@ -55,11 +54,11 @@
   def do_meta(self,tag):
     t=dict(tag)
     if t.get('name','x').lower() in ('keywords','description'):
-      print t['content']
+      self.formatter.add_flowing_data(t['content'])
 
   def feed(self,s):
-    htmllib.HTMLParser(self,s)
-    print s.title
+    htmllib.HTMLParser.feed(self,s)
+    self.formatter.add_flowing_data(self.title)
 
 
 class HTMLStripper(object):




More information about the Erp5-report mailing list