In [17]:
import pandas as pd
pd.set_option('display.max_rows', 100)
from techminer2.science_mapping.co_occurrence import communities
from techminer2.refine.thesaurus.descriptors import apply_thesaurus
from techminer2.refine.thesaurus.descriptors import list_cleanup
from techminer2.refine.thesaurus.descriptors import check_integrity
from techminer2.tools import coverage

# ---------------------------------------------------------------------------
# Configuration
# ---------------------------------------------------------------------------
# Single publication year analysed by this cell; used as both ends of the
# inclusive `year_filter` range below.
YEAR = 2017

# Project directory handed to every techminer2 call in this cell.
ROOT_DIR = "./"

# Field whose terms are analysed (coverage table and community tables).
FIELD = "descriptors"

# Document types kept by the database filter. Stored once, as an immutable
# tuple, so the coverage table and the community tables can never be computed
# on different sets of records by accident.
DOCUMENT_TYPES = (
    'Article',
    'Book chapter',
    'Conference paper',
    'Review',
    'Book',
    'Conference review',
    'Short survey',
    'Letter',
)


def _database_params():
    """Return the database filters shared by every query in this cell.

    A new dict (with a new ``document_type`` list) is built on each call so
    that every techminer2 function receives its own objects, exactly as when
    the arguments were written out literally at each call site.
    """
    return dict(
        root_dir=ROOT_DIR,
        database="main",
        year_filter=(YEAR, YEAR),
        cited_by_filter=(None, None),
        document_type=list(DOCUMENT_TYPES),
    )


# ---------------------------------------------------------------------------
# Coverage of the descriptors field for the selected year
# ---------------------------------------------------------------------------
# NOTE(review): this table is computed BEFORE the thesaurus is re-applied
# below, so it presumably reflects the thesaurus state left by the previous
# run of the cell -- confirm this ordering is intended.
#
# `.tail(20).head(18)` shows the first 18 of the last 20 rows of the table.
display(
    coverage(
        field=FIELD,
        #
        # DATABASE PARAMS:
        **_database_params(),
    ).tail(20).head(18)
)


# ---------------------------------------------------------------------------
# Refresh the descriptors thesaurus
# ---------------------------------------------------------------------------
# The three steps run in this fixed order: clean up, check, then apply.
# According to the log recorded with this cell, the last two steps operate on
# `descriptors.the.txt`.
list_cleanup(root_dir=ROOT_DIR)
check_integrity(root_dir=ROOT_DIR)
apply_thesaurus(root_dir=ROOT_DIR)


# ---------------------------------------------------------------------------
# Communities for increasing minimum-occurrence thresholds
# ---------------------------------------------------------------------------
# For every threshold 4..15 (inclusive), show the first 10 rows of the
# community table built from terms whose occurrence count is at least `occ`.
#
# NOTE(review): Louvain community detection is usually randomized; if
# `communities` exposes a seed/random-state argument, set it so the tables are
# reproducible across runs -- TODO confirm against the techminer2 API.
for occ in range(4, 16):

    print(f'------- {occ} -------')
    display(
        communities(
            #
            # COLUMN PARAMS:
            field=FIELD,
            top_n=None,
            occ_range=(occ, None),  # lower bound only; no upper bound
            gc_range=(None, None),
            custom_items=None,
            #
            # NETWORK PARAMS:
            algorithm_or_dict="louvain",
            association_index="association",
            #
            # DATABASE PARAMS:
            **_database_params(),
        ).head(10)
    )
    


--INFO-- Number of documents : 291
--INFO--   Documents with NA : 0
--INFO--  Efective documents : 291


Unnamed: 0,min_occ,cum_sum_documents,coverage,cum num items
10,27,242,83.16 %,11
11,23,247,84.88 %,13
12,22,247,84.88 %,14
13,19,249,85.57 %,15
14,18,252,86.60 %,16
15,17,262,90.03 %,20
16,15,263,90.38 %,22
17,13,268,92.10 %,28
18,12,269,92.44 %,29
19,11,269,92.44 %,34


--INFO-- Checking `descriptors.the.txt` integrity.
--INFO-- Applying `descriptors.the.txt` thesaurus to author/index keywords and abstract/title words
------- 4 -------


Unnamed: 0,CL_0,CL_1,CL_2,CL_3,CL_4,CL_5
0,DECISION_MAKING 075:0874,BIG_DATA 059:1428,INFORMATION_ANALYSIS 161:2063,BUSINESS_INTELLIGENCE_TOOLS 017:0055,PROJECT_MANAGERS 011:0101,INFORMATION_TECHNOLOGIES 018:0371
1,BUSINESS_INTELLIGENCE_SYSTEM 060:0789,DATA_MINING 046:0744,COMPETITIVE_INTELLIGENCE 124:1627,BUSINESS_PROCESSES 013:0116,INFORMATION_QUALITY 008:0133,COMPETITIVE_ADVANTAGES 017:0192
2,INFORMATION_SYSTEMS 053:0715,DATA_ANALYTICS 032:0953,OPERATIONS_RESEARCH 022:0187,DECISIONS 010:0103,BUSINESS_INTELLIGENCE_SUCCESS 008:0105,COMPETITIVENESS 013:0111
3,DATA_WAREHOUSE 049:0386,ANALYTICS 023:0491,KNOWLEDGE_MANAGEMENT 011:0179,ENTERPRISE_RESOURCE_PLANNING 008:0324,BUSINESS_INTELLIGENCE_PROJECTS 007:0092,BUSINESS_DECISIONS 008:0030
4,INFORMATION_USE 028:0156,DATA_HANDLING 017:0194,EDUCATION 011:0048,OPERATIONAL_BUSINESSES 008:0107,USER_SATISFACTION 007:0084,STRATEGY 007:0032
5,DECISION_SUPPORT_SYSTEM 027:0223,BUSINESS_ANALYTICS 015:0401,PLANNING 009:0032,DATA_PROCESSING 007:0017,SUCCESS_FACTORS 007:0067,BUSINESS_MANAGERS 006:0181
6,ARTIFICIAL_INTELLIGENCE 023:0213,SALES 013:0222,INTERNET_OF_THINGS 007:0507,NETWORK_FUNCTION_VIRTUALIZATION 006:0214,HOSPITALS 006:0085,BUSINESS_MODELS 005:0063
7,DECISION_MAKING_PROCESSES 019:0153,BIG_DATA_ANALYTICS 013:0181,EDUCATION_INSTITUTIONS 007:0037,ENTERPRISE_SYSTEMS 005:0284,SYSTEM_QUALITY 006:0075,BUSINESS_STRATEGY 005:0023
8,BUSINESS_INTELLIGENCE_SOLUTIONS 017:0105,META_DATA 013:0093,FINDINGS 006:0078,SUPPLY_CHAIN_MANAGEMENT 005:0067,PUBLIC_SECTORS 006:0021,INDUSTRY 004:0183
9,DECISION_MAKERS 015:0182,PREDICTIVE_ANALYTICS 011:0269,PROCESSES 006:0035,BUSINESS_INTELLIGENCE_MATURITY 005:0043,HUMAN_COMPUTER_INTERACTION 005:0037,ADVANTAGES 004:0037


------- 5 -------


Unnamed: 0,CL_0,CL_1,CL_2,CL_3,CL_4
0,INFORMATION_ANALYSIS 161:2063,BIG_DATA 059:1428,BUSINESS_INTELLIGENCE_SYSTEM 060:0789,INFORMATION_TECHNOLOGIES 018:0371,PROJECT_MANAGERS 011:0101
1,COMPETITIVE_INTELLIGENCE 124:1627,DATA_MINING 046:0744,INFORMATION_SYSTEMS 053:0715,COMPETITIVE_ADVANTAGES 017:0192,ENTERPRISE_RESOURCE_PLANNING 008:0324
2,DECISION_MAKING 075:0874,DATA_ANALYTICS 032:0953,INFORMATION_USE 028:0156,COMPETITIVENESS 013:0111,INFORMATION_QUALITY 008:0133
3,DATA_WAREHOUSE 049:0386,ANALYTICS 023:0491,DECISION_SUPPORT_SYSTEM 027:0223,META_DATA 013:0093,BUSINESS_INTELLIGENCE_SUCCESS 008:0105
4,OPERATIONS_RESEARCH 022:0187,DATA_HANDLING 017:0194,ARTIFICIAL_INTELLIGENCE 023:0213,KNOWLEDGE_MANAGEMENT 011:0179,BUSINESS_INTELLIGENCE_PROJECTS 007:0092
5,DECISION_MAKING_PROCESSES 019:0153,BUSINESS_ANALYTICS 015:0401,DECISION_SUPPORT 012:0123,SOCIAL_NETWORKS 009:0267,USER_SATISFACTION 007:0084
6,BUSINESS_INTELLIGENCE_SOLUTIONS 017:0105,SALES 013:0222,PLANNING 009:0032,RAW_DATA 009:0046,SUCCESS_FACTORS 007:0067
7,BUSINESS_INTELLIGENCE_TOOLS 017:0055,BIG_DATA_ANALYTICS 013:0181,BUSINESS_INTELLIGENCE_TECHNOLOGY 008:0233,SOCIAL_MEDIA 008:0286,SYSTEM_QUALITY 006:0075
8,DECISION_MAKERS 015:0182,BUSINESS_PROCESSES 013:0116,SEARCH_ENGINES 008:0092,BUSINESS_DECISIONS 008:0030,PUBLIC_SECTORS 006:0021
9,BUSINESS_INTELLIGENCE_APPLICATIONS 013:0068,PREDICTIVE_ANALYTICS 011:0269,SELF_SERVICE_BUSINESS_INTELLIGENCE 007:0075,STRATEGY 007:0032,BUSINESS_INTELLIGENCE_PROCESSING 005:0059


------- 6 -------


Unnamed: 0,CL_0,CL_1,CL_2,CL_3
0,INFORMATION_ANALYSIS 161:2063,BIG_DATA 059:1428,OPERATIONS_RESEARCH 022:0187,PROJECT_MANAGERS 011:0101
1,COMPETITIVE_INTELLIGENCE 124:1627,DATA_MINING 046:0744,INFORMATION_TECHNOLOGIES 018:0371,ENTERPRISE_RESOURCE_PLANNING 008:0324
2,DECISION_MAKING 075:0874,DATA_ANALYTICS 032:0953,COMPETITIVE_ADVANTAGES 017:0192,INFORMATION_QUALITY 008:0133
3,BUSINESS_INTELLIGENCE_SYSTEM 060:0789,ANALYTICS 023:0491,BUSINESS_INTELLIGENCE_TOOLS 017:0055,BUSINESS_INTELLIGENCE_SUCCESS 008:0105
4,INFORMATION_SYSTEMS 053:0715,DATA_HANDLING 017:0194,BUSINESS_PROCESSES 013:0116,BUSINESS_INTELLIGENCE_PROJECTS 007:0092
5,DATA_WAREHOUSE 049:0386,BUSINESS_ANALYTICS 015:0401,COMPETITIVENESS 013:0111,USER_SATISFACTION 007:0084
6,INFORMATION_USE 028:0156,SALES 013:0222,KNOWLEDGE_MANAGEMENT 011:0179,SUCCESS_FACTORS 007:0067
7,DECISION_SUPPORT_SYSTEM 027:0223,BIG_DATA_ANALYTICS 013:0181,RAW_DATA 009:0046,HOSPITALS 006:0085
8,ARTIFICIAL_INTELLIGENCE 023:0213,PREDICTIVE_ANALYTICS 011:0269,OPERATIONAL_BUSINESSES 008:0107,SYSTEM_QUALITY 006:0075
9,DECISION_MAKING_PROCESSES 019:0153,CLOUD_COMPUTING 010:0088,BUSINESS_DECISIONS 008:0030,PUBLIC_SECTORS 006:0021


------- 7 -------


Unnamed: 0,CL_0,CL_1,CL_2,CL_3
0,INFORMATION_ANALYSIS 161:2063,BIG_DATA 059:1428,OPERATIONS_RESEARCH 022:0187,COMPETITIVE_ADVANTAGES 017:0192
1,COMPETITIVE_INTELLIGENCE 124:1627,DATA_MINING 046:0744,BUSINESS_PROCESSES 013:0116,COMPETITIVENESS 013:0111
2,DECISION_MAKING 075:0874,DATA_ANALYTICS 032:0953,PROJECT_MANAGERS 011:0101,META_DATA 013:0093
3,BUSINESS_INTELLIGENCE_SYSTEM 060:0789,ANALYTICS 023:0491,ENTERPRISE_RESOURCE_PLANNING 008:0324,KNOWLEDGE_MANAGEMENT 011:0179
4,INFORMATION_SYSTEMS 053:0715,ARTIFICIAL_INTELLIGENCE 023:0213,INFORMATION_QUALITY 008:0133,RAW_DATA 009:0046
5,DATA_WAREHOUSE 049:0386,DATA_HANDLING 017:0194,OPERATIONAL_BUSINESSES 008:0107,
6,INFORMATION_USE 028:0156,BUSINESS_ANALYTICS 015:0401,BUSINESS_INTELLIGENCE_SUCCESS 008:0105,
7,DECISION_SUPPORT_SYSTEM 027:0223,SALES 013:0222,BUSINESS_INTELLIGENCE_PROJECTS 007:0092,
8,DECISION_MAKING_PROCESSES 019:0153,BIG_DATA_ANALYTICS 013:0181,USER_SATISFACTION 007:0084,
9,INFORMATION_TECHNOLOGIES 018:0371,PREDICTIVE_ANALYTICS 011:0269,SUCCESS_FACTORS 007:0067,


------- 8 -------


Unnamed: 0,CL_0,CL_1,CL_2
0,DECISION_MAKING 075:0874,BIG_DATA 059:1428,INFORMATION_ANALYSIS 161:2063
1,BUSINESS_INTELLIGENCE_SYSTEM 060:0789,DATA_MINING 046:0744,COMPETITIVE_INTELLIGENCE 124:1627
2,INFORMATION_SYSTEMS 053:0715,DATA_ANALYTICS 032:0953,OPERATIONS_RESEARCH 022:0187
3,DATA_WAREHOUSE 049:0386,ANALYTICS 023:0491,COMPETITIVE_ADVANTAGES 017:0192
4,INFORMATION_USE 028:0156,DATA_HANDLING 017:0194,COMPETITIVENESS 013:0111
5,DECISION_SUPPORT_SYSTEM 027:0223,BUSINESS_ANALYTICS 015:0401,META_DATA 013:0093
6,ARTIFICIAL_INTELLIGENCE 023:0213,SALES 013:0222,KNOWLEDGE_MANAGEMENT 011:0179
7,DECISION_MAKING_PROCESSES 019:0153,BIG_DATA_ANALYTICS 013:0181,DATA_VISUALISATION 011:0106
8,INFORMATION_TECHNOLOGIES 018:0371,PREDICTIVE_ANALYTICS 011:0269,PROJECT_MANAGERS 011:0101
9,BUSINESS_INTELLIGENCE_SOLUTIONS 017:0105,CLOUD_COMPUTING 010:0088,EDUCATION 011:0048


------- 9 -------


Unnamed: 0,CL_0,CL_1,CL_2
0,INFORMATION_ANALYSIS 161:2063,DECISION_MAKING 075:0874,INFORMATION_TECHNOLOGIES 018:0371
1,COMPETITIVE_INTELLIGENCE 124:1627,BUSINESS_INTELLIGENCE_SYSTEM 060:0789,COMPETITIVE_ADVANTAGES 017:0192
2,BIG_DATA 059:1428,INFORMATION_SYSTEMS 053:0715,BUSINESS_INTELLIGENCE_TOOLS 017:0055
3,DATA_MINING 046:0744,DATA_WAREHOUSE 049:0386,COMPETITIVENESS 013:0111
4,DATA_ANALYTICS 032:0953,INFORMATION_USE 028:0156,META_DATA 013:0093
5,ANALYTICS 023:0491,DECISION_SUPPORT_SYSTEM 027:0223,KNOWLEDGE_MANAGEMENT 011:0179
6,ARTIFICIAL_INTELLIGENCE 023:0213,DECISION_MAKING_PROCESSES 019:0153,DATA_VISUALISATION 011:0106
7,OPERATIONS_RESEARCH 022:0187,BUSINESS_INTELLIGENCE_SOLUTIONS 017:0105,VISUALIZATIONS 009:0046
8,DATA_HANDLING 017:0194,DECISION_MAKERS 015:0182,RAW_DATA 009:0046
9,BUSINESS_ANALYTICS 015:0401,DECISION_SUPPORT 012:0123,DASHBOARDS 009:0027


------- 10 -------


Unnamed: 0,CL_0,CL_1
0,INFORMATION_ANALYSIS 161:2063,DECISION_MAKING 075:0874
1,COMPETITIVE_INTELLIGENCE 124:1627,BUSINESS_INTELLIGENCE_SYSTEM 060:0789
2,BIG_DATA 059:1428,INFORMATION_SYSTEMS 053:0715
3,DATA_MINING 046:0744,DATA_WAREHOUSE 049:0386
4,DATA_ANALYTICS 032:0953,INFORMATION_USE 028:0156
5,ANALYTICS 023:0491,DECISION_SUPPORT_SYSTEM 027:0223
6,ARTIFICIAL_INTELLIGENCE 023:0213,DECISION_MAKING_PROCESSES 019:0153
7,OPERATIONS_RESEARCH 022:0187,INFORMATION_TECHNOLOGIES 018:0371
8,DATA_HANDLING 017:0194,COMPETITIVE_ADVANTAGES 017:0192
9,BUSINESS_ANALYTICS 015:0401,BUSINESS_INTELLIGENCE_SOLUTIONS 017:0105


------- 11 -------


Unnamed: 0,CL_0,CL_1,CL_2
0,INFORMATION_ANALYSIS 161:2063,DECISION_MAKING 075:0874,BIG_DATA 059:1428
1,COMPETITIVE_INTELLIGENCE 124:1627,BUSINESS_INTELLIGENCE_SYSTEM 060:0789,DATA_ANALYTICS 032:0953
2,DATA_MINING 046:0744,INFORMATION_SYSTEMS 053:0715,ANALYTICS 023:0491
3,ARTIFICIAL_INTELLIGENCE 023:0213,DATA_WAREHOUSE 049:0386,BUSINESS_INTELLIGENCE_TOOLS 017:0055
4,OPERATIONS_RESEARCH 022:0187,INFORMATION_USE 028:0156,BUSINESS_ANALYTICS 015:0401
5,DATA_HANDLING 017:0194,DECISION_SUPPORT_SYSTEM 027:0223,BIG_DATA_ANALYTICS 013:0181
6,COMPETITIVE_ADVANTAGES 017:0192,DECISION_MAKING_PROCESSES 019:0153,
7,SALES 013:0222,INFORMATION_TECHNOLOGIES 018:0371,
8,COMPETITIVENESS 013:0111,BUSINESS_INTELLIGENCE_SOLUTIONS 017:0105,
9,META_DATA 013:0093,DECISION_MAKERS 015:0182,


------- 12 -------


Unnamed: 0,CL_0,CL_1,CL_2,CL_3
0,DECISION_MAKING 075:0874,INFORMATION_ANALYSIS 161:2063,BIG_DATA 059:1428,INFORMATION_TECHNOLOGIES 018:0371
1,BUSINESS_INTELLIGENCE_SYSTEM 060:0789,COMPETITIVE_INTELLIGENCE 124:1627,DATA_ANALYTICS 032:0953,COMPETITIVE_ADVANTAGES 017:0192
2,INFORMATION_SYSTEMS 053:0715,DATA_MINING 046:0744,ANALYTICS 023:0491,BUSINESS_INTELLIGENCE_TOOLS 017:0055
3,DATA_WAREHOUSE 049:0386,ARTIFICIAL_INTELLIGENCE 023:0213,DATA_HANDLING 017:0194,COMPETITIVENESS 013:0111
4,INFORMATION_USE 028:0156,OPERATIONS_RESEARCH 022:0187,BUSINESS_ANALYTICS 015:0401,
5,DECISION_SUPPORT_SYSTEM 027:0223,SALES 013:0222,BIG_DATA_ANALYTICS 013:0181,
6,DECISION_MAKING_PROCESSES 019:0153,META_DATA 013:0093,BUSINESS_INTELLIGENCE_APPLICATIONS 013:0068,
7,BUSINESS_INTELLIGENCE_SOLUTIONS 017:0105,,,
8,DECISION_MAKERS 015:0182,,,
9,BUSINESS_PROCESSES 013:0116,,,


------- 13 -------


Unnamed: 0,CL_0,CL_1,CL_2
0,INFORMATION_ANALYSIS 161:2063,BIG_DATA 059:1428,INFORMATION_TECHNOLOGIES 018:0371
1,COMPETITIVE_INTELLIGENCE 124:1627,DATA_ANALYTICS 032:0953,COMPETITIVE_ADVANTAGES 017:0192
2,DECISION_MAKING 075:0874,ANALYTICS 023:0491,BUSINESS_INTELLIGENCE_TOOLS 017:0055
3,BUSINESS_INTELLIGENCE_SYSTEM 060:0789,DATA_HANDLING 017:0194,COMPETITIVENESS 013:0111
4,INFORMATION_SYSTEMS 053:0715,BUSINESS_ANALYTICS 015:0401,
5,DATA_WAREHOUSE 049:0386,BIG_DATA_ANALYTICS 013:0181,
6,DATA_MINING 046:0744,BUSINESS_INTELLIGENCE_APPLICATIONS 013:0068,
7,INFORMATION_USE 028:0156,,
8,DECISION_SUPPORT_SYSTEM 027:0223,,
9,ARTIFICIAL_INTELLIGENCE 023:0213,,


------- 14 -------


Unnamed: 0,CL_0,CL_1
0,DECISION_MAKING 075:0874,INFORMATION_ANALYSIS 161:2063
1,BUSINESS_INTELLIGENCE_SYSTEM 060:0789,COMPETITIVE_INTELLIGENCE 124:1627
2,INFORMATION_SYSTEMS 053:0715,BIG_DATA 059:1428
3,DATA_WAREHOUSE 049:0386,DATA_MINING 046:0744
4,INFORMATION_USE 028:0156,DATA_ANALYTICS 032:0953
5,DECISION_SUPPORT_SYSTEM 027:0223,ANALYTICS 023:0491
6,DECISION_MAKING_PROCESSES 019:0153,ARTIFICIAL_INTELLIGENCE 023:0213
7,INFORMATION_TECHNOLOGIES 018:0371,OPERATIONS_RESEARCH 022:0187
8,COMPETITIVE_ADVANTAGES 017:0192,DATA_HANDLING 017:0194
9,BUSINESS_INTELLIGENCE_SOLUTIONS 017:0105,BUSINESS_ANALYTICS 015:0401


------- 15 -------


Unnamed: 0,CL_0,CL_1
0,DECISION_MAKING 075:0874,INFORMATION_ANALYSIS 161:2063
1,BUSINESS_INTELLIGENCE_SYSTEM 060:0789,COMPETITIVE_INTELLIGENCE 124:1627
2,INFORMATION_SYSTEMS 053:0715,BIG_DATA 059:1428
3,DATA_WAREHOUSE 049:0386,DATA_MINING 046:0744
4,INFORMATION_USE 028:0156,DATA_ANALYTICS 032:0953
5,DECISION_SUPPORT_SYSTEM 027:0223,ANALYTICS 023:0491
6,DECISION_MAKING_PROCESSES 019:0153,ARTIFICIAL_INTELLIGENCE 023:0213
7,INFORMATION_TECHNOLOGIES 018:0371,OPERATIONS_RESEARCH 022:0187
8,COMPETITIVE_ADVANTAGES 017:0192,DATA_HANDLING 017:0194
9,BUSINESS_INTELLIGENCE_SOLUTIONS 017:0105,BUSINESS_ANALYTICS 015:0401
