ExternalDocument.py 2.5 KB
Newer Older
Jean-Paul Smets's avatar
Jean-Paul Smets committed
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26
##############################################################################
#
# Copyright (c) 2006-2007 Nexedi SARL and Contributors. All Rights Reserved.
#
# WARNING: This program as such is intended to be used by professional
# programmers who take the whole responsability of assessing all potential
# consequences resulting from its eventual inadequacies and bugs
# End users who are looking for a ready-to-use solution with commercial
# garantees and support are strongly adviced to contract a Free Software
# Service Company
#
# This program is Free Software; you can redistribute it and/or
# modify it under the terms of the GNU General Public License
# as published by the Free Software Foundation; either version 2
# of the License, or (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
#
##############################################################################
Jean-Paul Smets's avatar
Jean-Paul Smets committed
27 28 29

class ExternalDocument:
  """
  Properties of documents which have been downloaded from a URL. Most
  properties are used by the crawling API to frequently update content
  if necessary.

  Each entry of ``_properties`` is a dictionary holding the property
  'id', a human readable 'description', its 'type', its 'mode' and,
  for some properties, a 'default' value.
  """
  # NOTE: long descriptions are built with implicit concatenation of
  # adjacent string literals. Python joins the fragments verbatim, so
  # every fragment except the last one must end with a space.
  _properties = (
        {   'id'          : 'crawling_cache_duration',
            'description' : 'Defines the number of days a document should be kept in '
                            'public cache after it has disappeared from the Web.',
            'default'     : 10,
            'type'        : 'int',
            'mode'        : 'w'},
        {   'id'          : 'crawling_depth',
            'description' : 'Defines the maximum number of links which can be followed in the '
                            'crawling process. If set to 0 (default), no crawling happens.',
            'type'        : 'int',
            'default'     : 0,
            'mode'        : 'w'},
        # No 'default' is declared for crawling_scope.
        {   'id'          : 'crawling_scope',
            'description' : 'Defines whether the crawling process should be local to a single '
                            'domain or IP host. If so, crawling will not try to access '
                            'links outside the initial host.',
            'type'        : 'string',
            'mode'        : 'w'},
        )