# This patch file, files created by its use and not subject to other copyright # and any changes in other files generated by its use are # Copyright (C) 2000-2003 by the Free Software Foundation, Inc. # 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA # This patch file is Free Software and permission is granted to copy and # redistribute it in original or modified form under the terms of the # GNU General Public License (GPL). # See the GPL COPYING files accompanying Mailman distributions this # patch was intended to work in conjunction with for further details. diff -r -u -P mailman-2.1.3/Mailman/Archiver/HyperArch.py mailman-2.1.3-index/Mailman/Archiver/HyperArch.py --- mailman-2.1.3/Mailman/Archiver/HyperArch.py Mon Sep 22 03:40:51 2003 +++ mailman-2.1.3-index/Mailman/Archiver/HyperArch.py Mon Sep 29 16:33:20 2003 @@ -447,6 +447,8 @@ d['listurl'] = self._mlist.GetScriptURL('listinfo', absolute=1) d['listname'] = self._mlist.real_name d['encoding'] = '' + d["indexing_enable"] = mm_cfg.ARCHIVE_INDEXING_ENABLE + d["indexing_disable"] = mm_cfg.ARCHIVE_INDEXING_DISABLE finally: i18n.set_translation(otrans) @@ -638,6 +640,8 @@ "archivedate": quotetime(self.archivedate), "listinfo": mlist.GetScriptURL('listinfo', absolute=1), "version": self.version, + "indexing_enable": mm_cfg.ARCHIVE_INDEXING_ENABLE, + "indexing_disable": mm_cfg.ARCHIVE_INDEXING_DISABLE, } i = {"thread": _("thread"), "subject": _("subject"), @@ -674,6 +678,8 @@ "firstdate": quotetime(self.firstdate), "lastdate": quotetime(self.lastdate), "size": self.size, + "indexing_enable": mm_cfg.ARCHIVE_INDEXING_ENABLE, + "indexing_disable": mm_cfg.ARCHIVE_INDEXING_DISABLE, } i = {"thread": _("thread"), "subject": _("subject"), @@ -708,6 +714,8 @@ "fullarch": '../%s.mbox/%s.mbox' % (listname, listname), "size": sizeof(mbox, mlist.preferred_language), 'meta': '', + "indexing_enable": mm_cfg.ARCHIVE_INDEXING_ENABLE, + "indexing_disable": mm_cfg.ARCHIVE_INDEXING_DISABLE, } # Avoid i18n side-effects otrans = 
i18n.get_translation() @@ -773,7 +781,9 @@ 'archtocentry.html', {'archive': arch, 'archivelabel': self.volNameToDesc(arch), - 'textlink': textlink + 'textlink': textlink, + 'indexing_enable': mm_cfg.ARCHIVE_INDEXING_ENABLE, + 'indexing_disable': mm_cfg.ARCHIVE_INDEXING_DISABLE, }, mlist=self.maillist) diff -r -u -P mailman-2.1.3/Mailman/Defaults.py.in mailman-2.1.3-index/Mailman/Defaults.py.in --- mailman-2.1.3/Mailman/Defaults.py.in Mon Sep 22 05:26:14 2003 +++ mailman-2.1.3-index/Mailman/Defaults.py.in Mon Sep 29 16:33:20 2003 @@ -1243,6 +1243,23 @@ # Import a bunch of version numbers from Version import * +# Strings for wrapping html stuff we do not want a search engine to +# pay attention to in the pipermail archives. Of course the search engine +# must be able to interpret such strings. +ARCHIVE_INDEXING_ENABLE = '' +ARCHIVE_INDEXING_DISABLE = '' +# For example, you could insert the following into your mm_cfg if you +# were using htdig for searching archives. They are default values for +# htdig config attributes noindex_end and noindex_start respectively +#ARCHIVE_INDEXING_ENABLE = '<!--/htdig_noindex-->' +#ARCHIVE_INDEXING_DISABLE = '<!--htdig_noindex-->' +# You can also cater for controlling multiple search engines that +# recognise different tags to control what they should add to their +# indexes by putting the tags recognised by each search engine +# into the strings. For instance: +#ARCHIVE_INDEXING_ENABLE = '</noindex>\n<!--/htdig_noindex-->' +#ARCHIVE_INDEXING_DISABLE = '<noindex>\n<!--htdig_noindex-->' + # Vgg: Language descriptions and charsets dictionary, any new supported # language must have a corresponding entry here. Key is the name of the # directories that hold the localized texts.
Data are tuples with first diff -r -u -P mailman-2.1.3/README.NOINDEXtags mailman-2.1.3-index/README.NOINDEXtags --- mailman-2.1.3/README.NOINDEXtags Thu Jan 1 01:00:00 1970 +++ mailman-2.1.3-index/README.NOINDEXtags Mon Sep 29 16:33:20 2003 @@ -0,0 +1,29 @@ +If you are defining values for the ARCHIVE_INDEXING_ENABLE and +ARCHIVE_INDEXING_DISABLE configuration attributes in mm_cfg.py you +may want to try and control the indexing activities of multiple search +engines that you let access your mail archives. + +At the time of writing this, the problem you face is that there is no standard +tag defined to exert partial control over search engine indexing of a page. By +this I mean a way of telling the search engine to index only a specified part of +the page content. There is no formal or de facto standard equivalent to the +robot property on the HTML 4.0 META tag e.g. +<META NAME="ROBOTS" CONTENT="NOINDEX">, +which gives whole page control with most search engines. + +However, you should be able to put multiple start and stop indexing tags in the +values you assign to the ARCHIVE_INDEXING_ENABLE/DISABLE strings in mm_cfg.py. + +For example, some writers on the web suggest using <noindex> and </noindex> tags +because they are recognised and honoured by a number of search engines. + +The defaults recognised by htdig are actually HTML comments of the form +<!--htdig_noindex--> and <!--/htdig_noindex-->. + +You could combine these in your mm_cfg.py file as follows: + +ARCHIVE_INDEXING_ENABLE = '</noindex>\n<!--/htdig_noindex-->' +ARCHIVE_INDEXING_DISABLE = '<noindex>\n<!--htdig_noindex-->' + +Most browsers and search engines should be happy with the results of this as, in +general, they will ignore tags they do not understand and act on those they do. diff -r -u -P mailman-2.1.3/templates/cs/article.html mailman-2.1.3-index/templates/cs/article.html --- mailman-2.1.3/templates/cs/article.html Fri Dec 13 18:13:43 2002 +++ mailman-2.1.3-index/templates/cs/article.html Mon Sep 29 16:33:20 2003 @@ -12,6 +12,7 @@

%(subject_html)s

+%(indexing_disable)s %(author_html)s %(email_html)s @@ -28,9 +29,11 @@
+%(indexing_enable)s %(body)s +%(indexing_disable)s


Dal informace o konferenci %(listname)s
+%(indexing_enable)s diff -r -u -P mailman-2.1.3/templates/da/archidxfoot.html mailman-2.1.3-index/templates/da/archidxfoot.html --- mailman-2.1.3/templates/da/archidxfoot.html Mon Sep 22 04:52:33 2003 +++ mailman-2.1.3-index/templates/da/archidxfoot.html Mon Sep 29 16:33:20 2003 @@ -1,3 +1,4 @@ +%(indexing_disable)s

Dato på nyeste meddelelse: @@ -17,5 +18,6 @@


Dette arkiv blev genereret af Pipermail %(version)s. +%(indexing_enable)s diff -r -u -P mailman-2.1.3/templates/da/archidxhead.html mailman-2.1.3-index/templates/da/archidxhead.html --- mailman-2.1.3/templates/da/archidxhead.html Mon Sep 22 04:52:33 2003 +++ mailman-2.1.3-index/templates/da/archidxhead.html Mon Sep 29 16:33:20 2003 @@ -6,6 +6,7 @@ %(encoding)s +%(indexing_disable)s

Arkivet for %(archive)s sortert efter %(archtype)s

+%(indexing_disable)s +

Last message date: %(lastdate)s
@@ -17,5 +18,6 @@


This archive was generated by Pipermail %(version)s. +%(indexing_enable)s diff -r -u -P mailman-2.1.3/templates/en/archidxhead.html mailman-2.1.3-index/templates/en/archidxhead.html --- mailman-2.1.3/templates/en/archidxhead.html Tue Oct 8 17:50:41 2002 +++ mailman-2.1.3-index/templates/en/archidxhead.html Mon Sep 29 16:33:20 2003 @@ -6,7 +6,8 @@ %(encoding)s - +%(indexing_disable)s +

%(archive)s Archives by %(archtype)s


+%(indexing_enable)s %(body)s +%(indexing_disable)s


%(listname)s info
+%(indexing_enable)s diff -r -u -P mailman-2.1.3/templates/eu/archidxfoot.html mailman-2.1.3-index/templates/eu/archidxfoot.html --- mailman-2.1.3/templates/eu/archidxfoot.html Mon Sep 22 04:52:34 2003 +++ mailman-2.1.3-index/templates/eu/archidxfoot.html Mon Sep 29 16:33:20 2003 @@ -1,3 +1,4 @@ +%(indexing_disable)s

Azken mezuaren data: @@ -17,5 +18,6 @@


Pipermail %(version)s-ak sortu du fitxategi hau. +%(indexing_enable)s - \ No newline at end of file + diff -r -u -P mailman-2.1.3/templates/eu/archidxhead.html mailman-2.1.3-index/templates/eu/archidxhead.html --- mailman-2.1.3/templates/eu/archidxhead.html Mon Sep 22 04:52:34 2003 +++ mailman-2.1.3-index/templates/eu/archidxhead.html Mon Sep 29 16:33:20 2003 @@ -6,6 +6,7 @@ %(encoding)s +%(indexing_disable)s

%(archive)s Archives by %(archtype)s