2021-02-08 19:23:05 +03:00
|
|
|
"""
|
|
|
|
Implementation of the 'index' subcommand.
|
|
|
|
"""
|
2021-02-24 19:21:45 +03:00
|
|
|
import psutil
|
2021-02-08 19:23:05 +03:00
|
|
|
|
2021-04-16 15:20:09 +03:00
|
|
|
from nominatim.db import status
|
|
|
|
from nominatim.db.connection import connect
|
2021-02-08 19:23:05 +03:00
|
|
|
|
|
|
|
# Do not repeat documentation of subcommand classes.
|
|
|
|
# pylint: disable=C0111
|
|
|
|
# Using non-top-level imports to avoid eventually unused imports.
|
|
|
|
# pylint: disable=E0012,C0415
|
|
|
|
|
|
|
|
|
|
|
|
class UpdateIndex:
|
|
|
|
"""\
|
|
|
|
Reindex all new and modified data.
|
2021-10-12 00:27:38 +03:00
|
|
|
|
|
|
|
Indexing is the process of computing the address and search terms for
|
|
|
|
the places in the database. Every time data is added or changed, indexing
|
|
|
|
needs to be run. Imports and replication updates automatically take care
|
|
|
|
of indexing. For other cases, this function allows to run indexing manually.
|
2021-02-08 19:23:05 +03:00
|
|
|
"""
|
|
|
|
|
|
|
|
@staticmethod
|
|
|
|
def add_args(parser):
|
|
|
|
group = parser.add_argument_group('Filter arguments')
|
|
|
|
group.add_argument('--boundaries-only', action='store_true',
|
|
|
|
help="""Index only administrative boundaries.""")
|
|
|
|
group.add_argument('--no-boundaries', action='store_true',
|
|
|
|
help="""Index everything except administrative boundaries.""")
|
|
|
|
group.add_argument('--minrank', '-r', type=int, metavar='RANK', default=0,
|
|
|
|
help='Minimum/starting rank')
|
|
|
|
group.add_argument('--maxrank', '-R', type=int, metavar='RANK', default=30,
|
|
|
|
help='Maximum/finishing rank')
|
|
|
|
|
|
|
|
@staticmethod
|
|
|
|
def run(args):
|
|
|
|
from ..indexer.indexer import Indexer
|
2021-04-24 12:25:47 +03:00
|
|
|
from ..tokenizer import factory as tokenizer_factory
|
2021-02-08 19:23:05 +03:00
|
|
|
|
2021-04-24 12:25:47 +03:00
|
|
|
tokenizer = tokenizer_factory.get_tokenizer_for_db(args.config)
|
|
|
|
|
|
|
|
indexer = Indexer(args.config.get_libpq_dsn(), tokenizer,
|
2021-02-24 19:21:45 +03:00
|
|
|
args.threads or psutil.cpu_count() or 1)
|
2021-02-08 19:23:05 +03:00
|
|
|
|
|
|
|
if not args.no_boundaries:
|
|
|
|
indexer.index_boundaries(args.minrank, args.maxrank)
|
|
|
|
if not args.boundaries_only:
|
|
|
|
indexer.index_by_rank(args.minrank, args.maxrank)
|
|
|
|
|
|
|
|
if not args.no_boundaries and not args.boundaries_only \
|
|
|
|
and args.minrank == 0 and args.maxrank == 30:
|
2021-02-23 12:11:21 +03:00
|
|
|
with connect(args.config.get_libpq_dsn()) as conn:
|
|
|
|
status.set_indexed(conn, True)
|
2021-02-08 19:23:05 +03:00
|
|
|
|
|
|
|
return 0
|