/
__init__.py
69 lines (59 loc) · 2.13 KB
/
__init__.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
"""Keyword extraction/tagger for fabric8-analytics."""
# Descriptive package metadata.
__title__ = 'fabric8-analytics-tagger'
__author__ = 'Fridolin Pokorny'
__license__ = 'ASL 2.0'
__copyright__ = 'Copyright 2017 Fridolin Pokorny'

# The version is stored as a tuple of string components; the dotted form is
# derived from it so the two can never disagree.
__version_info__ = ('0', '1')
__version__ = '.'.join(__version_info__)
from .corpus import Corpus
from .errors import RemoteDependencyMissingError
from .keywords_chief import KeywordsChief
from .recipes import aggregate
from .recipes import collect
from .recipes import get_registered_collectors
from .recipes import get_registered_scorers
from .recipes import get_registered_stemmers
from .recipes import lookup_file
from .recipes import lookup_readme
from .recipes import lookup_text
from .recipes import reckon
from .tokenizer import Tokenizer
# Touch every name re-exported by this package exactly once.
# NOTE(review): presumably this exists so that linters do not report the
# package-level imports as unused - confirm before replacing with __all__.
assert all((
    Corpus,
    RemoteDependencyMissingError,
    KeywordsChief,
    aggregate,
    collect,
    get_registered_collectors,
    get_registered_scorers,
    get_registered_stemmers,
    lookup_file,
    lookup_readme,
    lookup_text,
    reckon,
    Tokenizer,
))
def prepare():
    """Prepare tagger for run.

    This should be run after installation to initialize tagger's resources.
    It downloads the NLTK "punkt" and "wordnet" data, fetches the
    maven-index-checker archive, unpacks it and moves the resulting jar into
    the directory returned by ``get_files_dir()``.

    :raises RemoteDependencyMissingError: if the maven-index-checker download
        does not come back with a successful HTTP status
    """
    # These imports happen only when prepare() is actually called.
    import nltk
    import requests
    from libarchive import extract_memory
    import os
    from shutil import move

    from f8a_tagger.utils import get_files_dir

    nltk.download("punkt")
    nltk.download("wordnet")

    maven_index_checker_url = ('https://github.com/fabric8-analytics/'
                               'maven-index-checker/files/1275145/'
                               'maven-index-checker-v0.1-alpha.zip')
    response = requests.get(maven_index_checker_url)
    if not response.ok:
        # Interpolate the status code into the message here: passing it as a
        # second positional argument would leave "%s" unformatted and make
        # str(exc) render as a tuple.
        raise RemoteDependencyMissingError(
            "Failed to download maven-index-checker with "
            "response code %s" % response.status_code)

    # Unfortunately no way how to know name or path of extracted file,
    # so assume it's maven-index-checker.jar
    jar_name = "maven-index-checker.jar"
    jar_path = get_files_dir()

    # NOTE(review): the jar is picked up via a relative path below, so the
    # archive is presumably unpacked into the current working directory -
    # confirm against the libarchive bindings in use.
    extract_memory(response.content)
    move(jar_name, os.path.join(jar_path, jar_name))