# This patch file, files created by its use and not subject to other copyright
# and any changes in other files generated by its use are
# Copyright (C) 2000-2003 by the Free Software Foundation, Inc.
# 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA
# This patch file is Free Software and permission is granted to copy and
# redistribute it in original or modified form under the terms of the
# GNU General Public License (GPL).
# See the GPL COPYING files accompanying Mailman distributions this
# patch was intended to work in conjunction with for further details.
diff -r -u -P mailman-2.1.3/Mailman/Archiver/HyperArch.py mailman-2.1.3-index/Mailman/Archiver/HyperArch.py
--- mailman-2.1.3/Mailman/Archiver/HyperArch.py Mon Sep 22 03:40:51 2003
+++ mailman-2.1.3-index/Mailman/Archiver/HyperArch.py Mon Sep 29 16:33:20 2003
@@ -447,6 +447,8 @@
d['listurl'] = self._mlist.GetScriptURL('listinfo', absolute=1)
d['listname'] = self._mlist.real_name
d['encoding'] = ''
+ d["indexing_enable"] = mm_cfg.ARCHIVE_INDEXING_ENABLE
+ d["indexing_disable"] = mm_cfg.ARCHIVE_INDEXING_DISABLE
finally:
i18n.set_translation(otrans)
@@ -638,6 +640,8 @@
"archivedate": quotetime(self.archivedate),
"listinfo": mlist.GetScriptURL('listinfo', absolute=1),
"version": self.version,
+ "indexing_enable": mm_cfg.ARCHIVE_INDEXING_ENABLE,
+ "indexing_disable": mm_cfg.ARCHIVE_INDEXING_DISABLE,
}
i = {"thread": _("thread"),
"subject": _("subject"),
@@ -674,6 +678,8 @@
"firstdate": quotetime(self.firstdate),
"lastdate": quotetime(self.lastdate),
"size": self.size,
+ "indexing_enable": mm_cfg.ARCHIVE_INDEXING_ENABLE,
+ "indexing_disable": mm_cfg.ARCHIVE_INDEXING_DISABLE,
}
i = {"thread": _("thread"),
"subject": _("subject"),
@@ -708,6 +714,8 @@
"fullarch": '../%s.mbox/%s.mbox' % (listname, listname),
"size": sizeof(mbox, mlist.preferred_language),
'meta': '',
+ "indexing_enable": mm_cfg.ARCHIVE_INDEXING_ENABLE,
+ "indexing_disable": mm_cfg.ARCHIVE_INDEXING_DISABLE,
}
# Avoid i18n side-effects
otrans = i18n.get_translation()
@@ -773,7 +781,9 @@
'archtocentry.html',
{'archive': arch,
'archivelabel': self.volNameToDesc(arch),
- 'textlink': textlink
+ 'textlink': textlink,
+ 'indexing_enable': mm_cfg.ARCHIVE_INDEXING_ENABLE,
+ 'indexing_disable': mm_cfg.ARCHIVE_INDEXING_DISABLE,
},
mlist=self.maillist)
diff -r -u -P mailman-2.1.3/Mailman/Defaults.py.in mailman-2.1.3-index/Mailman/Defaults.py.in
--- mailman-2.1.3/Mailman/Defaults.py.in Mon Sep 22 05:26:14 2003
+++ mailman-2.1.3-index/Mailman/Defaults.py.in Mon Sep 29 16:33:20 2003
@@ -1243,6 +1243,23 @@
# Import a bunch of version numbers
from Version import *
+# Strings for wrapping html stuff we do not want a search engine to
+# pay attention to in the pipermail archives. Of course the search engine
+# must be able to interpret such strings.
+ARCHIVE_INDEXING_ENABLE = ''
+ARCHIVE_INDEXING_DISABLE = ''
+# For example, you could insert the following into your mm_cfg if you
+# were using htdig for searching archives. They are default values for
+# htdig config attributes noindex_end and noindex_start respectively
+#ARCHIVE_INDEXING_ENABLE = '<!--/htdig_noindex-->'
+#ARCHIVE_INDEXING_DISABLE = '<!--htdig_noindex-->'
+# You can also cater for controlling multiple search engines that
+# recognise different tags to control what they should add to their
+# indexes by putting the tags recognised by each search engine
+# into the strings. For instance:
+#ARCHIVE_INDEXING_ENABLE = '<!--/htdig_noindex-->\n</noindex>'
+#ARCHIVE_INDEXING_DISABLE = '<!--htdig_noindex-->\n<noindex>'
+
# Vgg: Language descriptions and charsets dictionary, any new supported
# language must have a corresponding entry here. Key is the name of the
# directories that hold the localized texts. Data are tuples with first
diff -r -u -P mailman-2.1.3/README.NOINDEXtags mailman-2.1.3-index/README.NOINDEXtags
--- mailman-2.1.3/README.NOINDEXtags Thu Jan 1 01:00:00 1970
+++ mailman-2.1.3-index/README.NOINDEXtags Mon Sep 29 16:33:20 2003
@@ -0,0 +1,29 @@
+If you are defining values for the ARCHIVE_INDEXING_ENABLE and
+ARCHIVE_INDEXING_DISABLE configuration attributes in mm_cfg.py you
+may want to try to control the indexing activities of multiple search
+engines that you let access your mail archives.
+
+At the time of writing this, the problem you face is that there is no standard
+tag defined to exert partial control over search engine indexing of a page. By
+this I mean a way of telling the search engine to index only a specified part of
+the page content. There is no formal or de facto standard equivalent to the
+robot property on the HTML 4.0 META tag e.g.
+<META NAME="robots" CONTENT="noindex,nofollow">,
+which gives whole page control with most search engines.
+
+However, you should be able to put multiple start and stop indexing tags in the
+values you assign to the ARCHIVE_INDEXING_ENABLE/DISABLE strings in mm_cfg.py.
+
+For example, some writers on the web suggest using <noindex> and </noindex> tags
+because they are recognised and honoured by a number of search engines.
+
+The defaults recognised by htdig are actually HTML comments of the form
+<!--htdig_noindex--> and <!--/htdig_noindex-->.
+
+You could combine these in your mm_cfg.py file as follows:
+
+ARCHIVE_INDEXING_ENABLE = '<!--/htdig_noindex-->\n</noindex>'
+ARCHIVE_INDEXING_DISABLE = '<!--htdig_noindex-->\n<noindex>'
+
+Most browsers and search engines should be happy with the results of this as, in
+general, they will ignore tags they do not understand and act on those they do.
diff -r -u -P mailman-2.1.3/templates/cs/article.html mailman-2.1.3-index/templates/cs/article.html
--- mailman-2.1.3/templates/cs/article.html Fri Dec 13 18:13:43 2002
+++ mailman-2.1.3-index/templates/cs/article.html Mon Sep 29 16:33:20 2003
@@ -12,6 +12,7 @@