tools/search.py
author Tero Marttila <terom@fixme.fi>
Mon, 09 Feb 2009 11:46:17 +0200
changeset 65 8b50694f841e
child 68 8157c41b3236
permissions -rw-r--r--
improve search further
65
8b50694f841e improve search further
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
     1
"""
8b50694f841e improve search further
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
     2
    Tool for accessing the search index
8b50694f841e improve search further
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
     3
"""
8b50694f841e improve search further
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
     4
8b50694f841e improve search further
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
     5
import sys; sys.path.insert(0, '.'); sys.path.insert(0, '..')
8b50694f841e improve search further
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
     6
8b50694f841e improve search further
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
     7
import datetime, pytz
8b50694f841e improve search further
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
     8
8b50694f841e improve search further
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
     9
import log_search
8b50694f841e improve search further
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
    10
8b50694f841e improve search further
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
    11
def cmd_load(options, channel_name, *dates):
    """
        Load the logs of one channel for the given dates into the search index.

        options         - parsed options object; reads .index_path and .create_index
        channel_name    - name handed to channels.channel_list.lookup()
        *dates          - any number of date strings in YYYY-MM-DD form

        Prints each parsed date before its lines are loaded and inserted.

        Raises ValueError (from strptime) if a date string is not YYYY-MM-DD.
    """

    import channels

    # open the LogSearchIndex; mode '*' is passed when options.create_index is set, 'a' otherwise
    index = log_search.LogSearchIndex(options.index_path, '*' if options.create_index else 'a')

    # look up the channel whose log source we read from
    channel = channels.channel_list.lookup(channel_name)
    tz = channel.source.tz

    # NOTE(review): channel.source.tz is presumably a pytz timezone (this file uses pytz
    # for options.tz) - confirm. pytz zones must be attached with localize(): handing one
    # to replace(tzinfo=...) selects the zone's first (usually LMT) offset rather than the
    # offset in force on the given date. Other tzinfo implementations have no localize(),
    # so keep the plain replace() for those.
    localize = getattr(tz, 'localize', None)

    for date_name in dates:
        # parse the date as naive midnight, then attach the channel's timezone
        naive = datetime.datetime.strptime(date_name, '%Y-%m-%d')

        if localize is not None:
            date = localize(naive)
        else:
            date = naive.replace(tzinfo=tz)

        print("%s..." % (date, ))

        # load lines for date
        lines = channel.source.get_date(date)

        # insert
        index.insert(channel, lines)
8b50694f841e improve search further
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
    35
8b50694f841e improve search further
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
    36
def cmd_search(options, channel_name, query):
    """
        Search the index for events on a specific channel with the given query,
        printing each formatted result line.

        options         - parsed options object; reads .create_index, .index_path
                          and .formatter
        channel_name    - name handed to channels.channel_list.lookup()
        query           - query passed to LogSearchIndex.search_simple()

        Raises ValueError if options.create_index is set, since searching opens
        the index in 'r' mode and never creates it.
    """

    # validate before doing any work; an explicit check (rather than `assert`)
    # so that it is still enforced when python runs with -O
    if options.create_index:
        raise ValueError("cannot create the index while searching")

    import channels

    # open the LogSearchIndex in 'r' mode
    index = log_search.LogSearchIndex(options.index_path, 'r')

    # open the channel
    channel = channels.channel_list.lookup(channel_name)

    # search
    lines = index.search_simple(channel, query)

    # display as plaintext
    for line in options.formatter.format_txt(lines):
        print(line)
8b50694f841e improve search further
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
    57
8b50694f841e improve search further
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
    58
if __name__ == '__main__':
    # Command-line entry point: parse the options, then dispatch the first
    # positional argument to the module-level function named cmd_<command>,
    # passing the remaining positional arguments through.
    from optparse import OptionParser
    import log_formatter

    # define parser
    parser = OptionParser(
        usage           = "%prog [options] <command> [ ... ]",
        add_help_option = True,
    )

    # define command-line arguments
    parser.add_option("-I", "--index", dest="index_path", help="Index database path", metavar="PATH", default="logs/index")
    # --create is a flag: without action="store_true" optparse uses the default
    # "store" action and consumes the next argument (the command) as its value
    parser.add_option("--create", dest="create_index", action="store_true", help="Create index database", default=False)
    parser.add_option("-f", "--formatter", dest="formatter_name", help="LogFormatter to use", default="irssi")
    parser.add_option("-z", "--timezone", dest="tz_name", help="Timezone for output", metavar="TZ", default="UTC")

    # parse
    options, args = parser.parse_args()

    # a command is required; report it as a usage error instead of an IndexError
    if not args:
        parser.error("no command given")

    # pop command
    command = args.pop(0)

    # look up the handler; an unknown command is a usage error, not a KeyError
    func = globals().get('cmd_%s' % command)

    if func is None:
        parser.error("unknown command: %s" % command)

    # postprocess stuff: resolve the output timezone and build the formatter with it
    options.tz = pytz.timezone(options.tz_name)
    options.formatter = log_formatter.by_name(options.formatter_name)(options.tz)

    # call
    func(options, *args)
8b50694f841e improve search further
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
    89
8b50694f841e improve search further
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
    90