summaryrefslogtreecommitdiff
path: root/archivist/cli.py
blob: 5085ab725385d99ade7b89d5bb567e0a7c14ff80 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
import click
from functools import reduce
import operator as op

from .prefixes import query_pseudo_prefix, is_pseudo_prefix

# Context settings handed to the top-level click group: accept -h next to --help.
CONTEXT_SETTINGS = {'help_option_names': ['-h', '--help']}

def enable_debug():
    """Switch the 'peewee' logger to DEBUG and attach a new StreamHandler to it."""
    from logging import DEBUG, StreamHandler, getLogger

    peewee_log = getLogger('peewee')
    peewee_log.setLevel(DEBUG)
    peewee_log.addHandler(StreamHandler())

# Root command group; the --debug/-d flag enables peewee debug logging.
@click.group(context_settings=CONTEXT_SETTINGS)
@click.option('--debug', '-d', is_flag=True, default=False)
def cli(debug):
    if not debug:
        return
    enable_debug()

# Sub-group that holds the database commands; it has no behavior of its own.
@cli.group()
def db():
    """Database Management"""

@db.command()
def init():
    """Initialize the database, if not done already."""
    from .model import create_tables as make_tables, db as database
    from .prefixes import register_prefixes as install_prefixes

    make_tables()
    # Register the prefixes inside a single atomic block.
    with database.atomic():
        install_prefixes()

# Guarded by click's confirmation option, which prompts before the body runs.
@db.command()
@click.confirmation_option(prompt="Are you sure you want to drop the database?")
def drop():
    """Completely drop all tables."""
    from .model import drop_tables as drop_all_tables

    drop_all_tables()

# Sub-group that holds the tag commands; it has no behavior of its own.
@cli.group()
def tag():
    """Handling of tags"""

# Sub-group that holds the prefix commands; it has no behavior of its own.
@cli.group()
def prefix():
    """Handling of prefixes of tags"""

# `tag list [PATTERN]`: print the tags whose `default` flag is not set,
# optionally narrowed to those whose name or prefix contains PATTERN.
@tag.command('list')
@click.argument('pattern', required=False)
def list_tags(pattern):
    from .model import Tag

    # Heading followed by one empty line.
    for heading_line in ("Tags", "====", ""):
        print(heading_line)

    selection = Tag.select().where(~Tag.default)
    if pattern:
        matches_pattern = Tag.name.contains(pattern) | Tag.prefix.contains(pattern)
        selection = selection.where(matches_pattern)

    for entry in selection:
        text = entry.description
        # Only tags that carry a description get the "-- ..." suffix.
        suffix = '-- ' + text if text else ''
        print(' *', entry, suffix)

# `prefix list`: print every row of the Prefix table as a bullet list.
@prefix.command('list')
def list_prefixes():
    from .model import Prefix

    # Heading followed by one empty line.
    print("Prefixes", "========", "", sep="\n")

    for known_prefix in Prefix.select():
        print("  * %s" % (known_prefix,))

# `prefix add NAME [DESCRIPTION]`: create a prefix, or report that it already exists.
@prefix.command('add')
@click.argument('name')
@click.argument('description', required=False)
def add_prefix(name, description):
    from .model import Prefix

    created = Prefix.try_create(name=name, description=description)
    if created is not None:
        return
    # try_create handed back None, which this command reports as "already existed".
    print("Prefix already existed:", name)

def prefix_tag_name(name, prefix=None):
    """Return ``"<prefix>:<name>"``, or *name* unchanged when *prefix* is falsy."""
    if not prefix:
        return name
    return "%s:%s" % (prefix, name)

class PrefixTag:
    """A tag name together with an optional prefix.

    Iterating an instance yields ``prefix`` first and ``tag`` second, so it
    can be unpacked like a ``(prefix, tag)`` pair.
    """

    def __init__(self, tag, prefix = None):
        self.tag = tag
        self.prefix = prefix

    def __repr__(self):
        return '%s(%r, %r)' % (type(self).__name__, self.tag, self.prefix)

    def __str__(self):
        # The textual form is the prefixed name ("prefix:tag", or just "tag").
        return self.prefixed_name()

    def __iter__(self):
        yield self.prefix
        yield self.tag

    def prefixed_name(self):
        """Return the name built by ``prefix_tag_name`` from tag and prefix."""
        return prefix_tag_name(self.tag, self.prefix)

    def is_virtual(self):
        """Return True if a prefix is set and ``is_pseudo_prefix`` accepts it.

        Always returns a real ``bool``; without a prefix the pseudo-prefix
        check is not consulted at all.
        """
        if not self.prefix:
            return False
        return bool(is_pseudo_prefix(self.prefix))

    @property
    def virtual_query(self):
        """Result of ``query_pseudo_prefix`` for this prefix and tag."""
        return query_pseudo_prefix(self.prefix, self.tag)

class PrefixTagType(click.ParamType):
    """Click parameter type that turns ``[PREFIX:]NAME`` text into a PrefixTag."""
    name = 'prefixed tag'

    def convert(self, value, param, ctx):
        """Convert *value* to a PrefixTag.

        A value that already is a PrefixTag is returned unchanged. Otherwise
        the text is split at the first ':'; text without a ':' becomes a tag
        without prefix.
        """
        if isinstance(value, PrefixTag):
            return value

        prefix, separator, tag = value.partition(':')
        if not separator:
            return PrefixTag(value)
        return PrefixTag(tag, prefix)

# Shared PrefixTagType instance, used as ``type=TAG`` by the click arguments in this module.
TAG = PrefixTagType()

# `prefix edit NAME [IMPLIES]... [--description TEXT]`: add implications to the
# prefix's default tag and, when a description is given, store it on the prefix.
@prefix.command('edit')
@click.argument('name')
@click.argument('implies', type=TAG, nargs=-1)
@click.option('--description')
def edit_prefix(name, implies, description):
    from .model import Prefix, db

    try:
        target = Prefix.get(name=name)
    except Prefix.DoesNotExist:
        raise click.UsageError("Prefix '%s' does not exist." % name)

    with db.atomic():
        add_implications(target.default_tag, implies)
        if not description:
            # Nothing more to store; leave the atomic block normally.
            return
        target.description = description
        target.save()


def create_tag(name, description=None):
    """Create the tag described by *name*, creating its prefix when needed.

    *name* must expose ``.tag`` and ``.prefix`` (as PrefixTag does). Everything
    runs inside one ``db.atomic()`` block.

    Returns the ``(tag, created)`` pair produced by ``Tag.create_or_get``.

    Raises ``click.UsageError`` when the prefix already existed and is flagged
    ``virtual``.
    """
    from .model import Tag, TagImplications, Prefix, db

    with db.atomic():
        owner = None
        if name.prefix:
            owner, prefix_is_new = Prefix.get_or_create(name=name.prefix)
            if not prefix_is_new:
                if owner.virtual:
                    raise click.UsageError("Prefix '%s' is not allowed to carry additional tags." % name.prefix)

        new_tag, tag_is_new = Tag.create_or_get(
            name=name.tag,
            prefix=owner,
            description=description,
        )

        # A prefixed tag gets an implication onto its prefix's default tag.
        if owner is not None:
            TagImplications.try_create(tag=new_tag, implies_tag=owner.default_tag)

        return new_tag, tag_is_new

def fetch_tags(tag_list, ignore_missing=False):
    """Fetch the stored Tag rows for the requested tags.

    Args:
        tag_list: Iterable of requested tags; each entry must itself be
            iterable (PrefixTag yields prefix, then tag). May be empty or None.
        ignore_missing: When true, missing tags are only reported; otherwise
            they abort the command.

    Returns:
        ``[]`` for an empty request, otherwise the executed query result.

    Raises:
        click.ClickException: Some requested tag was not found and
            *ignore_missing* is false.
    """
    if not tag_list:
        return []

    from .model import Tag
    from .peewee_ext import sqlite_tuple_in

    # Collapse repeated requests (same prefix and name) while keeping order.
    # Otherwise a tag given twice makes the fetched count look too small and
    # triggers a bogus "not present" error although every tag exists.
    wanted = list({tuple(entry): entry for entry in tag_list}.values())

    fetched_tags = Tag.select().where(sqlite_tuple_in((Tag.prefix, Tag.name), wanted)).execute()
    if len(fetched_tags) < len(wanted):
        missing = set(map(str, wanted)).difference(map(str, fetched_tags))
        # Sorted so the report is stable between runs.
        print("Some tags were not present:", ', '.join(sorted(missing)))
        if not ignore_missing:
            raise click.ClickException("Not all tags present")

    return fetched_tags

# `tag add NAME [DESCRIPTION]`: create a tag, or report that it already exists.
@tag.command('add')
@click.argument('name', type=TAG)
@click.argument('description', required=False)
def add_tag(name, description):
    new_tag, was_created = create_tag(name, description)
    if was_created:
        return
    print("Tag already existed:", new_tag)

def add_implications(tag, implies):
    """Create a TagImplications row from *tag* to every tag named in *implies*.

    The implied tags are resolved through ``fetch_tags``. An IntegrityError on
    creation is reported as an already-existing implication and skipped.
    """
    from .model import TagImplications
    from peewee import IntegrityError

    link = TagImplications.create
    for implied in fetch_tags(implies):
        try:
            link(tag=tag, implies_tag=implied)
        except IntegrityError:
            print("Implication onto '%s' already existing. Skipping." % implied)

# `tag edit NAME [IMPLIES]... [--description TEXT]`: add implications to an
# existing tag and, when a description is given, store it on the tag.
@tag.command('edit')
@click.argument('name', type=TAG)
@click.argument('implies', type=TAG, nargs=-1)
@click.option('--description')
def edit_tag(name, implies, description):
    from .model import Tag, db

    try:
        target = Tag.get(name=name.tag, prefix=name.prefix)
    except Tag.DoesNotExist:
        raise click.UsageError("Tag '%s' does not exist." % name)

    with db.atomic():
        add_implications(target, implies)
        if not description:
            # Nothing more to store; leave the atomic block normally.
            return
        target.description = description
        target.save()

# Sub-group that holds the document commands; it has no behavior of its own.
@cli.group()
def doc():
    """Document handling"""

# `doc add FILE [TAGS]... [-c] [-i]`: store FILE's content as a Document and
# attach the given tags. With -c the tags are created via create_tag; otherwise
# they are looked up via fetch_tags, where -i tolerates missing ones.
@doc.command('add')
@click.argument('file', type=click.File(mode = 'rb'))
@click.argument('tags', type=TAG, nargs=-1)
@click.option('--create-tags', '-c', is_flag = True)
@click.option('--ignore-missing-tags', '-i', is_flag = True)
def add_doc(file, tags, create_tags, ignore_missing_tags):
    """Add a new document together with the given tags."""

    from .model import Document, db, DocumentTag
    import magic

    with db.atomic():
        if tags:
            if create_tags:
                tags = [create_tag(tag)[0] for tag in tags]
            else:
                tags = fetch_tags(tags, ignore_missing_tags)

        # Read the already-open handle once and detect the MIME type from
        # those bytes. Re-opening by file.name breaks for "-" (stdin), which
        # click.File accepts, and would read the file a second time.
        content = file.read()
        mimetype = magic.from_buffer(content, mime=True)

        doc = Document.create(content = content,
                file_type = mimetype,
                original_path = file.name,
                direction = Document.Direction.IN)

        for t in tags:
            DocumentTag.create(document = doc, tag = t)

# `doc find [TAGS]...`: print id and original path of the documents selected
# by the given tags. Without tags the unfiltered Document query is printed.
@doc.command('find')
@click.argument('tags', type=TAG, nargs=-1)
def find_doc(tags):
    from .model import Document, DocumentTag, TagClosure, Tag

    # Split the request into virtual (pseudo-prefix) tags and stored tags.
    pseudo_tags, normal_tags = [], []
    for requested in tags:
        bucket = pseudo_tags if requested.is_virtual() else normal_tags
        bucket.append(requested)

    query = Document.select()

    if normal_tags:
        # Build one sub-select of document ids per stored tag, covering the
        # tag and its descendants, and fold them together with `&`.
        # NOTE(review): `&` on peewee selects is presumably INTERSECT - confirm.
        tag_query = None
        for stored in fetch_tags(normal_tags):
            covered_ids = TagClosure.descendants(stored, include_node=True).select(Tag.id)
            doc_ids = DocumentTag.select(DocumentTag.document_id).where(DocumentTag.tag << covered_ids)
            tag_query = doc_ids if tag_query is None else tag_query & doc_ids

        query = query.where(Document.id << tag_query)

    if pseudo_tags:
        # AND together the conditions supplied by each virtual tag.
        conditions = [virtual.virtual_query for virtual in pseudo_tags]
        query = query.where(reduce(op.and_, conditions))

    for found in query.iterator():
        print("* ID %d -- %s" % (found.id, found.original_path))