[Erp5-report] r9078 - /erp5/trunk/utils/ooodoc_server/worker.py
nobody at svn.erp5.org
nobody at svn.erp5.org
Mon Aug 7 18:42:36 CEST 2006
Author: bartek
Date: Mon Aug 7 18:42:28 2006
New Revision: 9078
URL: http://svn.erp5.org?rev=9078&view=rev
Log:
Fixed text extraction from HTML.
Modified:
erp5/trunk/utils/ooodoc_server/worker.py
Modified: erp5/trunk/utils/ooodoc_server/worker.py
URL: http://svn.erp5.org/erp5/trunk/utils/ooodoc_server/worker.py?rev=9078&r1=9077&r2=9078&view=diff
==============================================================================
--- erp5/trunk/utils/ooodoc_server/worker.py (original)
+++ erp5/trunk/utils/ooodoc_server/worker.py Mon Aug 7 18:42:28 2006
@@ -28,7 +28,6 @@
##############################################################################
import os,sys,pdb,time, formatter, htmllib
-sys.path.append('/etc/ooodoc')
import config
sys.path.append(config.unopath)
import uno
@@ -55,11 +54,11 @@
def do_meta(self,tag):
t=dict(tag)
if t.get('name','x').lower() in ('keywords','description'):
- print t['content']
+ self.formatter.add_flowing_data(t['content'])
def feed(self,s):
- htmllib.HTMLParser(self,s)
- print s.title
+ htmllib.HTMLParser.feed(self,s)
+ self.formatter.add_flowing_data(self.title)
class HTMLStripper(object):
More information about the Erp5-report
mailing list