diff --git a/cybertools/text/doc.py b/cybertools/text/doc.py index f29610b..d2bd619 100644 --- a/cybertools/text/doc.py +++ b/cybertools/text/doc.py @@ -1,29 +1,9 @@ -# -# Copyright (c) 2007 Helmut Merz helmutm@cy55.de -# -# This program is free software; you can redistribute it and/or modify -# it under the terms of the GNU General Public License as published by -# the Free Software Foundation; either version 2 of the License, or -# (at your option) any later version. -# -# This program is distributed in the hope that it will be useful, -# but WITHOUT ANY WARRANTY; without even the implied warranty of -# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -# GNU General Public License for more details. -# -# You should have received a copy of the GNU General Public License -# along with this program; if not, write to the Free Software -# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA -# +# cybertools.text.doc -""" -Searchable text support for MS Word (.doc) files. +"""Searchable text support for MS Word (.doc) files. This uses the wvware command to perform the extraction. - Based on code provided by zc.index and TextIndexNG3. - -$Id$ """ import os, sys diff --git a/cybertools/text/html.py b/cybertools/text/html.py index 1338681..3e4bdcd 100644 --- a/cybertools/text/html.py +++ b/cybertools/text/html.py @@ -1,25 +1,6 @@ -# -# Copyright (c) 2007 Helmut Merz helmutm@cy55.de -# -# This program is free software; you can redistribute it and/or modify -# it under the terms of the GNU General Public License as published by -# the Free Software Foundation; either version 2 of the License, or -# (at your option) any later version. -# -# This program is distributed in the hope that it will be useful, -# but WITHOUT ANY WARRANTY; without even the implied warranty of -# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -# GNU General Public License for more details. 
-# -# You should have received a copy of the GNU General Public License -# along with this program; if not, write to the Free Software -# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA -# +# cybertools.text.html -""" -Searchable text support for HTML files. - -$Id$ +"""Searchable text support for HTML files. """ import os, sys diff --git a/cybertools/text/interfaces.py b/cybertools/text/interfaces.py index c74d6ff..14e737e 100644 --- a/cybertools/text/interfaces.py +++ b/cybertools/text/interfaces.py @@ -1,25 +1,6 @@ -# -# Copyright (c) 2006 Helmut Merz helmutm@cy55.de -# -# This program is free software; you can redistribute it and/or modify -# it under the terms of the GNU General Public License as published by -# the Free Software Foundation; either version 2 of the License, or -# (at your option) any later version. -# -# This program is distributed in the hope that it will be useful, -# but WITHOUT ANY WARRANTY; without even the implied warranty of -# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -# GNU General Public License for more details. -# -# You should have received a copy of the GNU General Public License -# along with this program; if not, write to the Free Software -# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA -# +# cybertools.text.interfaces -""" -interface definitions for text transformations. - -$Id$ +"""Interface definitions for text transformations. """ from zope.interface import Interface diff --git a/cybertools/text/mimetypes.py b/cybertools/text/mimetypes.py index 977415b..1f5ed30 100644 --- a/cybertools/text/mimetypes.py +++ b/cybertools/text/mimetypes.py @@ -1,25 +1,6 @@ -# -# Copyright (c) 2011 Helmut Merz helmutm@cy55.de -# -# This program is free software; you can redistribute it and/or modify -# it under the terms of the GNU General Public License as published by -# the Free Software Foundation; either version 2 of the License, or -# (at your option) any later version. 
-# -# This program is distributed in the hope that it will be useful, -# but WITHOUT ANY WARRANTY; without even the implied warranty of -# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -# GNU General Public License for more details. -# -# You should have received a copy of the GNU General Public License -# along with this program; if not, write to the Free Software -# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA -# +# cybertools.text.mimetypes -""" -Some mime types rules, redefined here for more specific assignments. - -$Id$ +"""Some MIME type rules, redefined here for more specific assignments. """ extensions = { diff --git a/cybertools/text/ooffice.py b/cybertools/text/ooffice.py index a1b7228..810ab96 100644 --- a/cybertools/text/ooffice.py +++ b/cybertools/text/ooffice.py @@ -1,27 +1,8 @@ -# -# Copyright (c) 2007 Helmut Merz helmutm@cy55.de -# -# This program is free software; you can redistribute it and/or modify -# it under the terms of the GNU General Public License as published by -# the Free Software Foundation; either version 2 of the License, or -# (at your option) any later version. -# -# This program is distributed in the hope that it will be useful, -# but WITHOUT ANY WARRANTY; without even the implied warranty of -# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -# GNU General Public License for more details. -# -# You should have received a copy of the GNU General Public License -# along with this program; if not, write to the Free Software -# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA -# +# cybertools.text.ooffice -""" -Searchable text support for OpenOffice files. +"""Searchable text support for OpenOffice files. Based on code provided by zc.index and TextIndexNG3. 
- -$Id$ """ import os, sys diff --git a/cybertools/text/pdf.py b/cybertools/text/pdf.py index 55b9271..1ac20d8 100644 --- a/cybertools/text/pdf.py +++ b/cybertools/text/pdf.py @@ -1,29 +1,9 @@ -# -# Copyright (c) 2007 Helmut Merz helmutm@cy55.de -# -# This program is free software; you can redistribute it and/or modify -# it under the terms of the GNU General Public License as published by -# the Free Software Foundation; either version 2 of the License, or -# (at your option) any later version. -# -# This program is distributed in the hope that it will be useful, -# but WITHOUT ANY WARRANTY; without even the implied warranty of -# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -# GNU General Public License for more details. -# -# You should have received a copy of the GNU General Public License -# along with this program; if not, write to the Free Software -# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA -# +# cybertools.text.pdf -""" -Searchable text support for Portable Document Format (PDF) files. +"""Searchable text support for Portable Document Format (PDF) files. This uses the pdftotext command from xpdf to perform the extraction. - Based on code provided by zc.index and TextIndexNG3. - -$Id$ """ import os, sys diff --git a/cybertools/text/ppt.py b/cybertools/text/ppt.py index b45f9eb..1170541 100644 --- a/cybertools/text/ppt.py +++ b/cybertools/text/ppt.py @@ -1,30 +1,10 @@ -# -# Copyright (c) 2007 Helmut Merz helmutm@cy55.de -# -# This program is free software; you can redistribute it and/or modify -# it under the terms of the GNU General Public License as published by -# the Free Software Foundation; either version 2 of the License, or -# (at your option) any later version. -# -# This program is distributed in the hope that it will be useful, -# but WITHOUT ANY WARRANTY; without even the implied warranty of -# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. 
See the -# GNU General Public License for more details. -# -# You should have received a copy of the GNU General Public License -# along with this program; if not, write to the Free Software -# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA -# +# cybertools.text.ppt -""" -Searchable text support for Portable Document Format (PDF) files. - -This uses the pdftotext command from xpdf to perform the extraction. -interface definitions for text transformations. +"""Searchable text support for PowerPoint (.ppt) files. +This uses the ppthtml command to perform the extraction. +Note: ppthtml is no longer available on current Debian or Ubuntu versions. Based on code provided by zc.index and TextIndexNG3. - -$Id$ """ import os, sys diff --git a/cybertools/text/rtf.py b/cybertools/text/rtf.py index 0e46c94..ce057c8 100644 --- a/cybertools/text/rtf.py +++ b/cybertools/text/rtf.py @@ -1,29 +1,9 @@ -# -# Copyright (c) 2007 Helmut Merz helmutm@cy55.de -# -# This program is free software; you can redistribute it and/or modify -# it under the terms of the GNU General Public License as published by -# the Free Software Foundation; either version 2 of the License, or -# (at your option) any later version. -# -# This program is distributed in the hope that it will be useful, -# but WITHOUT ANY WARRANTY; without even the implied warranty of -# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -# GNU General Public License for more details. -# -# You should have received a copy of the GNU General Public License -# along with this program; if not, write to the Free Software -# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA -# +# cybertools.text.rtf -""" -Searchable text support for MS Word (.doc) files. +"""Searchable text support for Rich Text Format (.rtf) files. This uses the wvware command to perform the extraction. - Based on code provided by zc.index and TextIndexNG3. 
- -$Id$ """ import os, sys diff --git a/cybertools/text/tests.py b/cybertools/text/tests.py index e735450..c11e21e 100755 --- a/cybertools/text/tests.py +++ b/cybertools/text/tests.py @@ -10,6 +10,7 @@ from cybertools.text import pdf warnings.filterwarnings('ignore', category=ResourceWarning) + class Test(unittest.TestCase): "Basic tests for the text package." diff --git a/cybertools/text/xls.py b/cybertools/text/xls.py index b3c7ac6..82b2dc3 100644 --- a/cybertools/text/xls.py +++ b/cybertools/text/xls.py @@ -1,29 +1,9 @@ -# -# Copyright (c) 2007 Helmut Merz helmutm@cy55.de -# -# This program is free software; you can redistribute it and/or modify -# it under the terms of the GNU General Public License as published by -# the Free Software Foundation; either version 2 of the License, or -# (at your option) any later version. -# -# This program is distributed in the hope that it will be useful, -# but WITHOUT ANY WARRANTY; without even the implied warranty of -# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -# GNU General Public License for more details. -# -# You should have received a copy of the GNU General Public License -# along with this program; if not, write to the Free Software -# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA -# +# cybertools.text.xls -""" -Searchable text support for MS Excel (.xls) files. +"""Searchable text support for MS Excel (.xls) files. This uses the xls2csv command to perform the extraction. - Based on code provided by zc.index and TextIndexNG3. - -$Id$ """ import os, sys