# Job Description Preprocessing and Extraction
This notebook uses the helper functions from the `utils` module to preprocess the *aufgaben* (tasks) text of each job posting and to extract sentence units and meaningful phrases from it.

In [6]:
import pandas as pd
from pathlib import Path
import config as C
from utils import (dedupe_lines, clean_text, split_units, extract_phrases, embed_texts, df_to_sqlite, as_json, get_spacy, find_span_in_text)

In [8]:
# Resolve both pipeline endpoints from the project config:
#   input_csv  - job_details file with the raw job descriptions
#   sqlite_out - SQLite database where everything will be stored
input_csv, sqlite_out = Path(C.JOBS_INPUT_CSV), Path(C.SQLITE_PATH)

# Echo the resolved locations so the run records which files it uses.
print("Input CSV:", input_csv)
print("Output SQLite file:", sqlite_out)


Input CSV: /Users/denysheryavenko/Desktop/EL Thesis/data/job_details.csv
Output SQLite file: /Users/denysheryavenko/Desktop/EL Thesis/data/db.sqlite


In [10]:
def pick_or_create_job_id(df):
    """Return the name of the column that identifies a job, creating one if needed.

    The first name in ``C.ID_CANDIDATES`` that is already a column of ``df``
    is returned and ``df`` is left untouched. If none of the candidates is
    present, a ``job_id`` column numbered 1..len(df) in row order is added to
    ``df`` in place, so the data set always has a primary key.

    Parameters
    ----------
    df : pandas.DataFrame
        Raw job data set. Mutated in place only when no candidate column exists.

    Returns
    -------
    str
        Name of the ID column to use.
    """
    for col in C.ID_CANDIDATES:
        if col in df.columns:
            return col

    # Number the rows positionally. range() avoids reset_index(), which copies
    # the whole frame just to count rows and raises a ValueError when the index
    # name matches an existing column.
    df["job_id"] = range(1, len(df) + 1)
    return "job_id"

### Load the raw data and inspect it

In [13]:
# Read the raw job postings and report their size and layout.
df = pd.read_csv(input_csv)
print("Total rows:", len(df))
print("Columns:", list(df.columns))

# The title is optional: a missing title column is filled with empty strings.
if C.COL_TITLE not in df.columns:
    df[C.COL_TITLE] = ""

# The description text is mandatory: abort when its column is absent.
if C.COL_TEXT not in df.columns:
    raise ValueError("The text column '" + C.COL_TEXT + "' is missing.")

# Use an existing ID column or create one (the helper adds it to df when needed).
id_col = pick_or_create_job_id(df)

# Per-column overview: dtype plus missing / non-missing counts.
variables = list(df.columns)
dtypes = [str(df[name].dtype) for name in variables]
missing = [df[name].isna().sum() for name in variables]
not_missing = [df[name].notna().sum() for name in variables]

schema_summary = pd.DataFrame(
    {
        "variable": variables,
        "dtype": dtypes,
        "missing": missing,
        "non_missing": not_missing,
    }
)

print("Schema and missing values:")
display(schema_summary)



Total rows: 400
Columns: ['title', 'url', 'deadline', 'location', 'aufgaben', 'erfordernisse']
Schema and missing values:


Unnamed: 0,variable,dtype,missing,non_missing
0,title,object,0,400
1,url,object,0,400
2,deadline,object,0,400
3,location,object,0,400
4,aufgaben,object,25,375
5,erfordernisse,object,7,393
6,job_id,int64,0,400


### Clean and Dedupe Text

In [16]:
# Display helpers: show full cell contents and let long lines wrap when printing.
from IPython.display import HTML, display

pd.set_option("display.max_colwidth", None)
pd.set_option("display.expand_frame_repr", False)
pd.set_option("display.width", 1000)

# A bare HTML(...) expression is only rendered when it is the last statement of
# a cell. Here it sits mid-cell, so it must be passed to display() explicitly,
# otherwise the stylesheet is silently discarded.
display(HTML("""
<style>
.output_area pre {
    white-space: pre-wrap;
}
</style>
"""))

# Dedupe the text of every job; missing descriptions are treated as "".
deduped_list = [dedupe_lines(text) for text in df[C.COL_TEXT].fillna("")]
df["text_deduped"] = deduped_list

# Simple cleaning that keeps the structure of the text.
clean_list = [clean_text(text) for text in df["text_deduped"]]
df["text_clean"] = clean_list

# Show one example: raw text next to its deduplicated and cleaned versions.
display(df[[id_col, C.COL_TEXT, "text_deduped", "text_clean"]].head(1))


Unnamed: 0,job_id,aufgaben,text_deduped,text_clean
0,1,"Die Verwendung als Vertragshochschullehrperson/Hochschullehrperson an der Privaten Pädagogischen Hochschule Burgenland erfolgt gem. § 48g des VBG bzw. § 200d BDG 1979.\nSie erfüllen Aufgaben und Tätigkeiten insbesondere in folgenden Bereichen:\n•\tLehre in Aus-, Fort- und Weiterbildung im Bereich der Primarstufe mit Fokus auf Sprachliche Bildung und Inklusive Pädagogik\n•\tBeratung von Studierenden, insbesondere Betreuung bei der Absolvierung der päda-gogisch-praktischen Studien und der Erstellung von Qualifizierungsarbeiten\n•\tMitarbeit im Zentrum für Minderheitenschulwesen, Mehrsprachigkeit und Inklusion\n•\tMitarbeit bei Aufgaben in der wissenschaftlich-berufsfeldbezogenen Forschung im ausgeschriebenen Bereich\n•\tMitwirkung an Organisations- und Verwaltungsaufgaben, einschließlich der\nEvaluierung und Qualitätssicherung im ausgeschriebenen Bereich\n•\tEntwicklung und Betreuung von Bildungsangeboten (Aus-, Fort- und Weiterbildung) im ausgeschriebenen Bereich\nDie Verwendung als Vertragshochschullehrperson/Hochschullehrperson an der Privaten Pädagogischen Hochschule Burgenland erfolgt gem. § 48g des VBG bzw. 
§ 200d BDG 1979.\nSie erfüllen Aufgaben und Tätigkeiten insbesondere in folgenden Bereichen:\n•\tLehre in Aus-, Fort- und Weiterbildung im Bereich der Primarstufe mit Fokus auf Sprachliche Bildung und Inklusive Pädagogik\n•\tBeratung von Studierenden, insbesondere Betreuung bei der Absolvierung der päda-gogisch-praktischen Studien und der Erstellung von Qualifizierungsarbeiten\n•\tMitarbeit im Zentrum für Minderheitenschulwesen, Mehrsprachigkeit und Inklusion\n•\tMitarbeit bei Aufgaben in der wissenschaftlich-berufsfeldbezogenen Forschung im ausgeschriebenen Bereich\n•\tMitwirkung an Organisations- und Verwaltungsaufgaben, einschließlich der\nEvaluierung und Qualitätssicherung im ausgeschriebenen Bereich\n•\tEntwicklung und Betreuung von Bildungsangeboten (Aus-, Fort- und Weiterbildung) im ausgeschriebenen Bereich\nDie Verwendung als Vertragshochschullehrperson/Hochschullehrperson an der Privaten Pädagogischen Hochschule Burgenland erfolgt gem. § 48g des VBG bzw. § 200d BDG 1979.\nSie erfüllen Aufgaben und Tätigkeiten insbesondere in folgenden Bereichen:\n•\tLehre in Aus-, Fort- und Weiterbildung im Bereich der Primarstufe mit Fokus auf Sprachliche Bildung und Inklusive Pädagogik\n•\tBeratung von Studierenden, insbesondere Betreuung bei der Absolvierung der päda-gogisch-praktischen Studien und der Erstellung von Qualifizierungsarbeiten\n•\tMitarbeit im Zentrum für Minderheitenschulwesen, Mehrsprachigkeit und Inklusion\n•\tMitarbeit bei Aufgaben in der wissenschaftlich-berufsfeldbezogenen Forschung im ausgeschriebenen Bereich\n•\tMitwirkung an Organisations- und Verwaltungsaufgaben, einschließlich der\nEvaluierung und Qualitätssicherung im ausgeschriebenen Bereich\n•\tEntwicklung und Betreuung von Bildungsangeboten (Aus-, Fort- und Weiterbildung) im ausgeschriebenen Bereich","Die Verwendung als Vertragshochschullehrperson/Hochschullehrperson an der Privaten Pädagogischen Hochschule Burgenland erfolgt gem. § 48g des VBG bzw. 
§ 200d BDG 1979.\nSie erfüllen Aufgaben und Tätigkeiten insbesondere in folgenden Bereichen:\n•\tLehre in Aus-, Fort- und Weiterbildung im Bereich der Primarstufe mit Fokus auf Sprachliche Bildung und Inklusive Pädagogik\n•\tBeratung von Studierenden, insbesondere Betreuung bei der Absolvierung der päda-gogisch-praktischen Studien und der Erstellung von Qualifizierungsarbeiten\n•\tMitarbeit im Zentrum für Minderheitenschulwesen, Mehrsprachigkeit und Inklusion\n•\tMitarbeit bei Aufgaben in der wissenschaftlich-berufsfeldbezogenen Forschung im ausgeschriebenen Bereich\n•\tMitwirkung an Organisations- und Verwaltungsaufgaben, einschließlich der\nEvaluierung und Qualitätssicherung im ausgeschriebenen Bereich\n•\tEntwicklung und Betreuung von Bildungsangeboten (Aus-, Fort- und Weiterbildung) im ausgeschriebenen Bereich","Die Verwendung als Vertragshochschullehrperson/Hochschullehrperson an der Privaten Pädagogischen Hochschule Burgenland erfolgt gem. 48g des VBG bzw. 200d BDG 1979.\nSie erfüllen Aufgaben und Tätigkeiten insbesondere in folgenden Bereichen:\n• Lehre in Aus-, Fort- und Weiterbildung im Bereich der Primarstufe mit Fokus auf Sprachliche Bildung und Inklusive Pädagogik\n• Beratung von Studierenden, insbesondere Betreuung bei der Absolvierung der päda-gogisch-praktischen Studien und der Erstellung von Qualifizierungsarbeiten\n• Mitarbeit im Zentrum für Minderheitenschulwesen, Mehrsprachigkeit und Inklusion\n• Mitarbeit bei Aufgaben in der wissenschaftlich-berufsfeldbezogenen Forschung im ausgeschriebenen Bereich\n• Mitwirkung an Organisations- und Verwaltungsaufgaben, einschließlich der\nEvaluierung und Qualitätssicherung im ausgeschriebenen Bereich\n• Entwicklung und Betreuung von Bildungsangeboten (Aus-, Fort- und Weiterbildung) im ausgeschriebenen Bereich"


### Save Cleaned Jobs to SQL

In [19]:
# Keep the job ID, the title and both processed text columns, then hand the
# copy to df_to_sqlite for the 'jobs_clean' table.
jobs_clean_columns = [id_col, C.COL_TITLE, "text_deduped", "text_clean"]
df_jobs_clean = df[jobs_clean_columns].copy()
df_to_sqlite(df_jobs_clean, sqlite_out, "jobs_clean")

print("Saved", len(df_jobs_clean), "rows to the table 'jobs_clean' in the file:", sqlite_out)


Saved 400 rows to the table 'jobs_clean' in the file: /Users/denysheryavenko/Desktop/EL Thesis/data/db.sqlite


### Split Clean Job Descriptions into Units

In [22]:
nlp = get_spacy()
rows = []  # one (job ID, unit text, span start, span end) tuple per kept unit

# Only the ID and the cleaned text are needed, so iterate over those two
# columns directly. iterrows() would build a Series for every row, which is
# slow and does not preserve dtypes across the row.
for job_id, text in zip(df[id_col], df["text_clean"]):

    # split based on the rules from utils; min_words_per_unit avoids tiny
    # units such as "und", "z.B.", etc.
    units = split_units(text, nlp, min_words_per_unit=C.MIN_WORDS_PER_UNIT)

    for u in units:
        # drop leftover symbols like dashes or bullets that became units (just to be safe)
        if len(u) > 2:
            start, end = find_span_in_text(text, u, allow_fuzzy=False)
            rows.append((job_id, u, start, end))

print("Total units extracted:", len(rows))

# Summary statistics: how many units each job produced.
if len(rows) > 0:

    # number of units per job; jobs that produced no unit do not appear here
    job_unit_count = {}
    for job_id, unit, start, end in rows:
        job_unit_count[job_id] = job_unit_count.get(job_id, 0) + 1

    counts = list(job_unit_count.values())

    units_summary = pd.DataFrame({
        "": ["Jobs with units", "Min. units per job", "Max. units per job", "Avg. units per job"],
        # object dtype keeps the three counts as integers; mixing them with the
        # float average would otherwise turn the whole column into floats
        # (e.g. 375.0 instead of 375)
        "value": pd.Series(
            [
                len(job_unit_count),
                min(counts),
                max(counts),
                round(sum(counts) / len(counts), 2),
            ],
            dtype=object,
        ),
    })

    print("Unit summary per job:")
    display(units_summary)



Total units extracted: 2798
Unit summary per job:


Unnamed: 0,Unnamed: 1,value
0,Jobs with units,375.0
1,Min. units per job,1.0
2,Max. units per job,45.0
3,Avg. units per job,7.46


### Embed Units and Load to SQL
The units are embedded in small batches, because embedding all of them at once can exhaust memory or be too slow.

In [25]:
parts = []  # per-batch data frames, concatenated into the final table below

if len(rows) > 0:

    # Guard the batch size: with a value of 0 or less the batching loop could
    # never advance through the rows.
    if C.EMBED_BATCH_SIZE <= 0:
        raise ValueError("C.EMBED_BATCH_SIZE must be a positive integer.")

    # go through the rows in small batches
    for start_idx in range(0, len(rows), C.EMBED_BATCH_SIZE):
        batch = rows[start_idx:start_idx + C.EMBED_BATCH_SIZE]

        # transpose the (job_id, unit_text, start, end) tuples into four lists
        job_ids_for_batch, texts, unit_starts, unit_ends = (
            list(column) for column in zip(*batch)
        )

        # create the embeddings for this batch
        vectors = embed_texts(texts)

        # convert to json to store later
        embedding_json_list = [as_json(v) for v in vectors]

        # build a small data frame for this batch and add it to "parts"
        # NOTE(review): the recorded output shows unit_start / unit_end as
        # floats (0.0, 163.0), which suggests some spans are missing; consider
        # a nullable integer dtype once df_to_sqlite is confirmed to support it.
        temp = pd.DataFrame({
            id_col: job_ids_for_batch,
            "unit_text": texts,
            "unit_start": unit_starts,  # span start
            "unit_end": unit_ends,      # span end
            "embedding_json": embedding_json_list
        })
        parts.append(temp)

    # finally combine all batch data frames into one
    df_units = pd.concat(parts, ignore_index=True)

else:
    # in case there are no units at all (rare, but avoids errors)
    df_units = pd.DataFrame(columns=[id_col, "unit_text", "unit_start", "unit_end", "embedding_json"])

df_to_sqlite(df_units, sqlite_out, "job_units")

print("Saved", len(df_units))
print("First 5 embedded units:")
display(df_units.head(5))

Saved 2798
First 5 embedded units:


Unnamed: 0,job_id,unit_text,unit_start,unit_end,embedding_json
0,1,Die Verwendung als Vertragshochschullehrperson/Hochschullehrperson an der Privaten Pädagogischen Hochschule Burgenland erfolgt gem. 48g des VBG bzw. 200d BDG 1979.,0.0,163.0,"[-0.0467069074511528, 0.07633580267429352, 0.014378831721842289, -0.06591174006462097, -0.018646089360117912, -0.055108193308115005, -0.055728789418935776, 0.043197277933359146, -0.031259842216968536, 0.0607299841940403, -0.027741484344005585, 0.0465974323451519, 0.013985693454742432, -0.010024764575064182, 0.0006732718320563436, 0.003746406640857458, -0.0407872311770916, 0.06492248922586441, 0.11102385818958282, 0.009165982715785503, 0.0019169887527823448, 0.023175017908215523, -0.04300393536686897, -0.009107372723519802, 0.012004981748759747, -0.01820218935608864, 0.013675807043910027, -0.09065210819244385, 0.012825148180127144, -0.02829897031188011, -0.025130396708846092, -0.07788825780153275, -0.00947112962603569, -0.034796856343746185, -0.04851222410798073, 0.037638962268829346, 0.051352087408304214, 0.015244615264236927, 0.018196387216448784, -0.025787409394979477, -0.03999375179409981, -0.018948683515191078, -0.014552670530974865, 0.072743259370327, -0.035460665822029114, -0.009560085833072662, -0.08099948614835739, -0.011046198196709156, -0.11107669025659561, -0.05189419537782669, 0.02468244358897209, -0.002245720010250807, -0.04189645126461983, 0.04640894755721092, -0.011343390680849552, -0.02474522776901722, 0.09367907792329788, 0.025170041248202324, -0.02728627249598503, 0.014774003997445107, -0.08868058770895004, 0.09395807236433029, -0.011947584338486195, -0.01855204440653324, 0.011676546186208725, -0.014602135866880417, -0.022060738876461983, 0.04882935434579849, 0.0584370382130146, -0.013440917246043682, -0.06643152981996536, -0.09199093282222748, -0.0127731217071414, 0.07183413952589035, 0.07565333694219589, 0.013732723891735077, -0.05077660456299782, 0.1391603797674179, 0.06268829852342606, -0.10662790387868881, 0.09438852220773697, -0.009814027696847916, 
0.03265304118394852, -0.019270312041044235, -0.06691306829452515, -0.06500685960054398, -0.02224516123533249, -0.003026350401341915, 0.05533917620778084, -0.03291229531168938, 0.01927092671394348, -0.08305671066045761, -0.01731819286942482, -0.07915724813938141, -0.022380558773875237, 0.024143753573298454, -0.03985020890831947, -0.0164254829287529, 0.0065809087827801704, 0.09058734774589539, -0.05062597990036011, -0.03837648779153824, 0.017477741464972496, 0.03419307991862297, -0.06553729623556137, 0.057305313646793365, 0.018860185518860817, -0.03166412189602852, -0.05224459990859032, -0.05645929276943207, -0.04273909702897072, -0.04116499423980713, -0.003142709843814373, -0.00669092359021306, -0.05129961296916008, 0.009708082303404808, 0.0381058007478714, 0.0011397501220926642, 0.060570940375328064, 0.03486655652523041, -0.008617510087788105, -0.0074234954081475735, -0.016780734062194824, -0.12026256322860718, -0.010697842575609684, -0.0019364830804988742, -0.03071577660739422, -0.018017806112766266, 0.006009502802044153, -0.023742178454995155, 0.04625953733921051, 0.043914709240198135, 0.007292511407285929, 0.035484280437231064, 0.032004036009311676, 0.007546125911176205, 0.019922899082303047, 0.02181340754032135, 0.024847203865647316, -0.04111132770776749, 0.020474320277571678, 0.06980962306261063, 0.03073013760149479, 0.03793172165751457, -0.03060549683868885, 0.06556032598018646, 0.03920494019985199, 0.1610822081565857, 0.06605690717697144, 0.056832119822502136, 0.037126325070858, 0.04701727256178856, 0.06286271661520004, -0.005124077200889587, -0.07840447127819061, 0.051445845514535904, 0.018771549686789513, 0.0052757360972464085, 0.09255879372358322, -0.03150446340441704, -0.044555749744176865, 0.02215629443526268, 0.1252775937318802, -0.06660842895507812, 0.07357212901115417, 0.0533977746963501, 0.048299312591552734, -0.11215689033269882, 0.04566865786910057, -0.019671762362122536, 0.05047733336687088, 0.03714488446712494, 0.02583218365907669, 
0.01818600855767727, 0.02397136390209198, -0.03301570564508438, 0.011384261772036552, 0.042299676686525345, 0.016935760155320168, 0.0112204160541296, -0.034704744815826416, -0.011087307706475258, 0.027848275378346443, -0.039493072777986526, 0.05310678854584694, 0.039375267922878265, 0.03129279986023903, -0.13240166008472443, 0.019533205777406693, 0.12357765436172485, -0.046800412237644196, -0.05226687341928482, -0.006862251088023186, -0.15436077117919922, -0.07628770172595978, 0.007676613982766867, 0.1583966612815857, -0.17841550707817078, 0.027304770424962044, -0.006826978176832199, 0.010970311239361763, 0.06738060712814331, -0.012658396735787392, 0.022211402654647827, -0.021804850548505783, -0.023540537804365158, 0.016626793891191483, -0.03488040715456009, 0.022301698103547096, 0.006657407619059086, -0.007730699144303799, -0.012681687250733376, -0.032347533851861954, -0.003947713878005743, -0.009963763877749443, 0.03595975786447525, -0.005043564364314079, 0.036714572459459305, -0.02230105921626091, 0.03623174875974655, -0.038689855486154556, 0.07322120666503906, -0.026172785088419914, -0.07778193056583405, -0.009748647920787334, 0.04247858375310898, -0.0806596651673317, 0.0329156294465065, 0.017458004876971245, -0.04645566642284393, 0.02955896221101284, -0.05513608083128929, 0.008988233283162117, 0.024808337911963463, 0.015569660812616348, -0.10477470606565475, 0.015352189540863037, 0.025028875097632408, -0.08217309415340424, 0.033418383449316025, -0.014773552305996418, -0.031131254509091377, -0.09489723294973373, -0.0228028055280447, 0.01737341657280922, 0.027129417285323143, 0.029062118381261826, 0.07810600101947784, 0.05058804899454117, -0.09441983699798584, -0.02688458189368248, -0.015620145946741104, -0.03219779208302498, -0.003597820643335581, 0.07804906368255615, 0.027029525488615036, 0.035887934267520905, 0.01565956324338913, -0.030244391411542892, -0.13009768724441528, 0.08658041805028915, 0.030641254037618637, 0.005865495651960373, 0.005398833658546209, 
0.05082214996218681, -0.05569758638739586, -0.041307300329208374, -0.024027356877923012, -0.03226809576153755, 0.019312240183353424, -0.014033808372914791, -0.012437325902283192, 0.03043530508875847, -0.00044122253893874586, -0.04506516829133034, -0.06706687062978745, 0.04563238099217415, 0.020431824028491974, 0.00816814973950386, -0.012419378384947777, -0.02000003308057785, 0.031696029007434845, 0.05362217500805855, -0.006213210057467222, 0.0850767120718956, 0.03020484745502472, -0.08840929716825485, 0.007422175724059343, -0.04914214834570885, 0.04666643589735031, -0.0019055756274610758, 0.03600533679127693, -0.055258609354496, 0.0365729033946991, 0.024866217747330666, 0.0395331010222435, -0.02040116675198078, 0.012283964082598686, -0.09095364809036255, 0.008721982128918171, 0.07891932874917984, 0.021160364151000977, -0.07335124909877777, -0.008582919836044312, -0.05201148986816406, -0.07327473163604736, 0.0014694039709866047, 0.0023564693983644247, -0.02758035622537136, 0.002830138895660639, 0.042114343494176865, -0.09750883281230927, 0.06910033524036407, -0.03796767443418503, 0.010553328320384026, -0.01951608993113041, -0.04493981972336769, -0.10305498540401459, 0.02818433567881584, -0.06086467206478119, 0.010882709175348282, -0.08728405833244324, 0.0006000638240948319, 0.05053448677062988, 0.04909206181764603, -0.010646233335137367, -0.053156111389398575, 0.01993846707046032, -0.05631391704082489, 0.07764104008674622, -0.02105010859668255, -0.06647342443466187, -0.032244693487882614, -0.022221367806196213, 0.05767560377717018, -0.04483233019709587, 0.031185783445835114, 0.0672229677438736, 0.07057451456785202, -0.00635960279032588, -0.010154657997190952, -0.03374030813574791, -0.022893080487847328, 0.09179365634918213, -0.11012488603591919, -0.02353598177433014, 0.04136819764971733, 0.10435358434915543, -0.05653555691242218, 0.0021894900128245354, -0.0151581522077322, 0.06262315064668655, 0.035734422504901886, -0.05626446753740311, 0.03666262701153755, 
0.020529206842184067, -0.0003452734963502735, -0.02508998103439808, 0.08052171021699905, 0.036007605493068695, 0.022048546001315117, -0.07145605236291885, 0.06132640689611435, 0.000377048272639513, 0.06794004142284393, 0.01613495498895645, -0.030861305072903633, 0.06871449947357178, -0.02002665400505066, 0.0890304371714592, -0.04027740657329559, 0.041991643607616425, 0.0261358805000782, -0.08933147042989731, 0.06808802485466003, -0.040143292397260666, 0.024649687111377716, -0.057980313897132874, -0.05494994670152664, 0.013592386618256569, -0.06144354119896889, 0.05847597494721413, -0.027126697823405266, 0.059248488396406174]"
1,1,Sie erfüllen Aufgaben und Tätigkeiten insbesondere in folgenden Bereichen:,164.0,238.0,"[0.014505060389637947, -0.030078105628490448, 0.018849607557058334, 0.009000302292406559, -0.03201911970973015, -0.003859644988551736, 0.02968871220946312, 0.030092991888523102, -0.04836520552635193, 0.0528617724776268, 0.00024576688883826137, -0.01773758791387081, -0.022695837542414665, 0.011038931086659431, 0.05559081956744194, 0.021550176665186882, 0.03229827433824539, -0.016891758888959885, 0.003870707703754306, -0.01172620803117752, 0.024412227794528008, -0.0567033626139164, -0.015940358862280846, -0.023765597492456436, -0.02081952802836895, 0.018136922270059586, -0.09934470057487488, -0.030688557773828506, 0.016590120270848274, -0.0633535236120224, -0.022705934941768646, 0.012390900403261185, 0.06625539809465408, 0.037805721163749695, -0.031761284917593, 0.09593552350997925, -0.005715162493288517, 0.003020145930349827, 0.04096497595310211, -0.0300129521638155, 0.025263847783207893, -0.07994072884321213, 0.02661142125725746, 0.01218626368790865, 0.00017866790585685521, -0.05857718363404274, -0.004688336048275232, -0.036082517355680466, -0.06549485772848129, -0.040639474987983704, -0.03288988396525383, -0.06722155213356018, 0.011980893090367317, 0.014828071929514408, -0.00828830897808075, 0.013522655703127384, 0.07583703100681305, 0.05065559595823288, 0.009354022331535816, 0.020560942590236664, 0.09175027161836624, 0.015639537945389748, -0.09858547151088715, 0.03666362166404724, 0.03191409260034561, -0.020712653174996376, 0.051039356738328934, 0.03134351968765259, -0.07254046946763992, 0.060915544629096985, -0.08227697759866714, -0.02806089259684086, -0.013998957350850105, -0.04128521680831909, 0.039639804512262344, -0.013019867241382599, -0.010220269672572613, -0.029847608879208565, -0.003576794406399131, -0.015902463346719742, 0.04582943394780159, 0.0002588370116427541, 0.04347727447748184, 0.08128199726343155, -0.000498852226883173, 0.0357077531516552, 
-0.013541140593588352, 0.008392583578824997, 0.051928240805864334, -0.02445089817047119, 0.006371465511620045, -0.013608806766569614, 0.02531297318637371, -0.08186636120080948, 0.031464144587516785, 0.002649573376402259, 0.012082258239388466, -0.0031230226159095764, 0.022845717146992683, 0.08926524221897125, -0.030774148181080818, 0.06924676150083542, 0.004745743237435818, -0.0663766860961914, -0.018869368359446526, 0.014851680025458336, -0.04037440940737724, -0.11946213990449905, -0.021206384524703026, 0.02959405444562435, -0.055075753480196, 0.03856150060892105, -0.10122141242027283, -0.03227531909942627, -0.028108546510338783, -0.06211262568831444, -0.014967003837227821, 0.03029031679034233, 0.004468414932489395, 0.03632611036300659, -0.005920480936765671, -0.047225408256053925, 0.09490624815225601, -0.04984107241034508, 0.07154971361160278, -0.003991721663624048, -0.041549164801836014, 0.00690986355766654, -0.003879603696987033, -0.06202371418476105, 0.03612416237592697, 0.012644714675843716, -0.0619245283305645, -0.006093544885516167, -0.024866878986358643, -0.0058526452630758286, 0.1118827685713768, -0.055548690259456635, -0.01341244112700224, 0.1083720400929451, 0.04155600443482399, 0.09277476370334625, 0.14931292831897736, 0.04555108770728111, 0.024910133332014084, 0.056854113936424255, -0.0704057440161705, -0.02043093368411064, 0.01675526425242424, 0.04331627115607262, 0.054080232977867126, -0.009715410880744457, 0.11242574453353882, 0.034312956035137177, -6.090859096730128e-05, 0.00026527870795689523, -0.11071093380451202, -0.03738855943083763, 0.10257285833358765, -0.02415657229721546, -0.10547836124897003, 0.07039672136306763, -0.0008912172634154558, 0.08459535241127014, -0.0860208123922348, -0.03754420951008797, 0.022426621988415718, -0.037399083375930786, -0.033988017588853836, 0.022793525829911232, 0.015753043815493584, 0.014111824333667755, 0.06702769547700882, -0.024323605000972748, 0.015408824197947979, 0.02936043217778206, -0.025921516120433807, 
0.02078450471162796, -0.0006794179789721966, -0.0014583246083930135, 0.11754210293292999, -0.07125196605920792, 0.033839307725429535, -0.00891483947634697, 0.004265000578016043, 0.01784958876669407, 0.034701623022556305, 0.023687664419412613, 0.016060635447502136, -0.0351111926138401, -0.1310368776321411, -0.0043434142135083675, 0.03113068826496601, 0.06029534339904785, -0.02673061564564705, -0.03128752484917641, 0.11206290870904922, -0.02734229899942875, -0.007193787954747677, 0.025590939447283745, -0.06319630146026611, 0.010479756630957127, -0.04430760070681572, 0.03376363217830658, -0.00022419217566493899, -0.019071480259299278, -0.014512516558170319, 0.05808120220899582, 0.04294442757964134, -0.062070369720458984, -0.07120897620916367, -0.013809127733111382, -0.002925107255578041, -0.0589342825114727, 0.038856543600559235, -0.022723499685525894, -0.02668435499072075, 0.026515474542975426, -0.06504584103822708, 0.003858319716528058, -0.06420845538377762, 0.07544445246458054, 0.0192863866686821, -0.09630730748176575, -0.06774409860372543, 0.039640046656131744, -0.08503066748380661, 0.029617605730891228, 0.0029374375008046627, -0.014665408991277218, -0.03708076849579811, -0.10822037607431412, 0.05140449479222298, 0.019276220351457596, -0.14395186305046082, -0.020685499534010887, -0.018091678619384766, 0.012755138799548149, -0.02448510006070137, -0.02399703860282898, -0.014795192517340183, 0.006436681374907494, -0.04022722318768501, 0.0335032157599926, -0.03911798819899559, 0.11405280977487564, 0.05311600863933563, 0.06098976731300354, -0.04323364421725273, 0.08627986162900925, -0.05979602411389351, -0.12261883914470673, -0.023608248680830002, -0.047003455460071564, -0.044276874512434006, -0.01941153034567833, -0.0001084447794710286, -0.013024603947997093, -0.03290416672825813, 0.03925860673189163, -0.02252991870045662, 0.024924365803599358, 0.0363353006541729, 0.07890097796916962, 0.08872399479150772, -0.02712608128786087, 0.03306080773472786, 0.039341039955616, 
0.0017703884514048696, 0.00035856119939126074, -0.08954212814569473, -0.02089698240160942, -0.10833026468753815, -0.05073630437254906, -0.00263291341252625, -0.09500676393508911, -0.047993119806051254, -0.09491003304719925, 0.06003465875983238, 0.124969981610775, 0.017724527046084404, -0.09464682638645172, -0.005205186549574137, 0.0029057685751467943, 0.0009494530386291444, 0.011673429049551487, 0.07253265380859375, 0.06489858776330948, -0.03610005974769592, 0.04448786750435829, 0.02082974649965763, 0.006426322739571333, -0.002522968454286456, -0.06471355259418488, 0.015645425766706467, -0.010537398047745228, 0.006180884782224894, -0.052186112850904465, -0.1519302874803543, -0.004171452019363642, 0.03238629549741745, -0.031202999874949455, -0.011210296303033829, -0.0023518544621765614, 0.03409549593925476, -0.0071968506090343, 0.01740133762359619, 0.01720886491239071, -0.04401020333170891, 0.07424387335777283, -0.014363971538841724, 0.014261215925216675, 0.018411457538604736, -0.05677283927798271, 0.02423180267214775, 0.00920246634632349, -0.04710778594017029, 0.02653053030371666, 0.05529223755002022, -0.07205642759799957, 0.0077055953443050385, 0.017028408125042915, -0.1033317819237709, -0.018502673134207726, -0.06907173991203308, -0.09629519283771515, -0.06829950213432312, 0.04676176235079765, 0.08083546161651611, 0.07947644591331482, 0.031142160296440125, -0.003275069175288081, 0.04311678186058998, -0.038452934473752975, 0.10158626735210419, 0.06379316002130508, 0.04244018346071243, 0.12740465998649597, -0.04329084977507591, -0.03352176025509834, 0.1430322527885437, 0.005586385261267424, -0.06289064139127731, 0.01647663675248623, -0.03881470113992691, -0.037994809448719025, -0.0104423388838768, 0.05055035278201103, 0.030872181057929993, 0.059466954320669174, 0.04202431067824364, 0.015978442505002022, 0.001922306139022112, -0.08214615285396576, 0.06723901629447937, -0.01804233342409134, 0.03081945702433586, -0.031171543523669243, -0.024219030514359474, 
-0.012550982646644115, -0.013289806433022022, -0.04917900636792183, 0.027304984629154205, 0.06573697179555893, -0.0016462535131722689, -0.06236813962459564, -0.10243328660726547, 0.08786706626415253, 0.05307278037071228, -0.04491499066352844, -0.07978733628988266, 0.054416246712207794, -0.009459326975047588, 0.026577623561024666, -0.02168523147702217, 0.08859270066022873, 0.08036281168460846, -0.007586614228785038, 0.0354529544711113, 0.04740643873810768, 0.013724509626626968, 0.03187670558691025, 0.0460701622068882, 0.006803266238421202]"
2,1,"Lehre in Aus-, Fort- und Weiterbildung im Bereich der Primarstufe mit Fokus auf Sprachliche Bildung und Inklusive Pädagogik",241.0,364.0,"[0.0819167047739029, 0.011704627424478531, 0.050741564482450485, -0.010205879807472229, -0.05134326592087746, 0.0038531916216015816, -0.04764701798558235, -0.012560436502099037, -0.011834846809506416, -0.022554954513907433, 0.011420183815062046, 0.02533380687236786, 0.014609644189476967, 0.042344626039266586, 0.07233414053916931, 0.041096098721027374, 0.040323156863451004, 0.05698573216795921, 0.04095861688256264, -0.10812367498874664, -0.052524078637361526, 0.02363300882279873, 0.04943254590034485, -0.005119250621646643, 0.018094230443239212, 0.016185522079467773, 0.05517258867621422, -0.02508898265659809, 0.10138726234436035, -0.06304381787776947, -0.0015330041060224175, -0.03202921524643898, 0.09479464590549469, 0.01936071179807186, -0.09707353264093399, 0.11855786293745041, 0.023839015513658524, 0.05589766800403595, -0.004337135702371597, -0.019433125853538513, -0.01875324174761772, -0.015181201510131359, 0.012774129398167133, 0.010578418150544167, 0.012772409245371819, -0.03658483549952507, -0.06441772729158401, -0.022415753453969955, -0.04301640763878822, -0.07892552018165588, -0.06882434338331223, -0.06779400259256363, -0.03386356681585312, 0.01984436623752117, -0.003227817127481103, -0.013183340430259705, 0.05536384880542755, 0.04798806458711624, -0.04068533703684807, 0.1257621943950653, -0.09279809147119522, 0.018114333972334862, -0.058151330798864365, 0.07283122837543488, -0.051116667687892914, 0.0018124091438949108, 0.06277855485677719, 0.08773430436849594, -0.06187755987048149, -0.06556416302919388, -0.02996714599430561, 0.01963702030479908, 0.03586500510573387, 0.07163318991661072, 0.00872043427079916, 0.052333664149045944, -0.025158071890473366, 0.030390851199626923, 0.09271109849214554, -0.04722039774060249, 0.0808282420039177, 0.04917918145656586, 0.05281111225485802, 0.022186117246747017, 
-0.00732843391597271, -0.039102911949157715, -0.026078302413225174, 0.02129213511943817, -0.031612057238817215, -0.05946900695562363, -0.006956068333238363, -0.11749029904603958, 0.04817081242799759, 0.06158638000488281, 0.05561216548085213, -0.08039437979459763, 0.051243264228105545, -0.07028917968273163, -0.05719394236803055, 0.08339965343475342, -0.019117701798677444, -0.026005735620856285, 0.014668150804936886, -0.004562326706945896, -0.028626808896660805, 0.03368265554308891, 0.02787255123257637, -0.015361608937382698, -0.016155635938048363, -0.04622082784771919, -0.01343696378171444, -0.03232363611459732, -0.07907470315694809, 0.02308366261422634, -0.015387414954602718, -0.021896973252296448, 0.11064129322767258, -0.02289493940770626, 0.036066342145204544, 0.07893404364585876, -0.04762997478246689, -0.004845150746405125, -0.004402070306241512, -0.09059909731149673, 0.019793467596173286, -0.06830944120883942, 0.00295927538536489, 0.025471197441220284, 0.015338337980210781, -0.019648801535367966, 0.05517064034938812, 0.018152914941310883, -0.017361419275403023, 0.09715709090232849, 0.012177834287285805, -0.04381309822201729, 0.01074229832738638, -0.02877286821603775, 0.03196956589818001, 0.0067679318599402905, -0.0012597779277712107, 0.07130324840545654, 0.02526308223605156, 0.043141260743141174, -0.028156131505966187, -0.006073142867535353, 0.005373967345803976, 0.0620092898607254, 0.05061887204647064, 0.014143751934170723, 0.013998298905789852, -0.014514841139316559, -0.00836625974625349, -0.059754159301519394, 0.01885821484029293, -0.054027583450078964, 0.06558497995138168, -0.011856322176754475, 0.017873480916023254, -0.029054097831249237, -0.10123211145401001, 0.0379335917532444, -0.015378455631434917, -0.026847437024116516, 0.06008788198232651, -0.016479136422276497, 0.0014863676624372602, -0.05619706213474274, 0.03315852954983711, -0.03966784477233887, 0.06490381062030792, 0.01238342933356762, 0.05281830206513405, 0.06696924567222595, 
0.059699010103940964, -0.04989476874470711, -0.022788552567362785, 0.022454068064689636, -0.000621241400949657, -0.02846423164010048, -0.020210761576890945, -0.054913245141506195, 0.04019373655319214, 0.020504552870988846, -0.003162788227200508, 0.05203857645392418, 0.036601029336452484, -0.02861451543867588, 0.006222624331712723, 0.09706757217645645, 0.018261471763253212, 0.02227381244301796, -0.02208862639963627, -0.12425590306520462, -0.076535165309906, -0.020256606861948967, 0.08502890914678574, -0.14672736823558807, -0.09991216659545898, 0.022171739488840103, -0.05443263426423073, 0.04016571491956711, -0.026334505528211594, -0.007954690605401993, -0.01353525836020708, -0.03142353892326355, 0.11700717359781265, -0.007656186353415251, 0.02244364097714424, 0.052939653396606445, -0.012142623774707317, 0.0625884085893631, 0.02064821682870388, -0.01888570562005043, 0.001592096989043057, -0.028640341013669968, 0.0055245645344257355, 0.10043131560087204, -0.008404409512877464, 0.0596231073141098, -0.06265738606452942, -0.03337400034070015, 0.07319292426109314, -0.049314048141241074, -0.00039355148328468204, 0.07556749880313873, -0.10672838240861893, 0.05700067803263664, 0.04666387662291527, 0.01619655452668667, 0.02764930948615074, -0.014464757405221462, 0.031208526343107224, 0.04725388064980507, -0.12136486172676086, -0.013688282109797001, 0.1043042242527008, 0.06349769979715347, -0.05852261558175087, -0.008301048539578915, -0.006052905227988958, 0.08594071865081787, 0.015387428924441338, 0.02572087198495865, -0.03343237191438675, -0.013227866031229496, -0.0811508372426033, -0.059844594448804855, 0.03316442668437958, 0.0018746701534837484, -0.05487295240163803, -0.0018298933282494545, -0.07532425969839096, -0.03616033494472504, 0.09415622800588608, 0.006541152019053698, -0.03284381330013275, -0.02890009805560112, -0.07684466242790222, -0.004922738764435053, 0.01174926571547985, -0.1140836626291275, -0.05607767403125763, 0.1793939173221588, -0.013863283209502697, 
-0.040039949119091034, -0.058588169515132904, -0.07326159626245499, -0.064358651638031, -0.00045027537271380424, -0.06683376431465149, -0.003718186169862747, -0.0867341086268425, 0.010016359388828278, 0.001292381202802062, 0.031813185662031174, -0.028873588889837265, -0.11771842837333679, 0.012078778818249702, -0.0604066364467144, 0.05832614749670029, -0.01160014420747757, -0.02306780405342579, 0.011325000785291195, 0.05909382551908493, -0.020719872787594795, 0.02189817652106285, -0.0543900690972805, 0.08882454037666321, 0.06353919208049774, 0.04008051007986069, 0.035960715264081955, -0.002107322681695223, -0.025681791827082634, 0.030607091262936592, 0.016829511150717735, -0.0582091324031353, -0.03844963386654854, -0.016455108299851418, 0.10053476691246033, 0.05349329859018326, 0.00827337708324194, -0.05063888430595398, -0.013475305400788784, -0.04331636801362038, -0.05018264800310135, -0.044734712690114975, -0.0510188452899456, -0.04261287674307823, 0.09330884367227554, 0.0013683602446690202, -0.02400865964591503, 0.044080138206481934, -0.03242875263094902, -0.023630626499652863, 0.008973907679319382, -0.009704085066914558, -0.08341509848833084, 0.07142370939254761, -0.05626489222049713, -0.032280389219522476, -0.022011801600456238, 0.010382180102169514, -0.006822854746133089, -0.006095224991440773, -0.020825590938329697, -0.026661034673452377, -0.023425044491887093, -0.013197900727391243, 0.061813149601221085, -0.11157558113336563, -0.004388485569506884, -0.03912058845162392, 0.0012515163980424404, 0.016073551028966904, 0.05281124264001846, 0.04242997616529465, 0.007282544858753681, 0.053787317126989365, 0.023718377575278282, 0.07612887024879456, 0.029488300904631615, -0.04914981126785278, 0.04593172296881676, -0.10310098528862, -0.06342662870883942, 0.03247881308197975, 0.05541466549038887, -0.09795938432216644, 0.01655397191643715, 0.005912845954298973, 0.043238066136837006, -0.038544148206710815, -0.07242672145366669, 0.00768336933106184, 
-0.011617074720561504, 0.024710992351174355, -0.01609628275036812, 0.04914766177535057, 0.010603700764477253, 0.0031116283498704433, -0.11293335258960724, 0.07285218685865402, -0.03414008766412735, 0.022425945848226547, 0.05439665913581848, -0.05929771065711975, 0.03501312807202339, -0.05642462521791458, 0.02032184973359108, 0.02002600207924843, -0.06007690727710724, -0.004193013533949852, -0.011979267001152039, 0.09334713220596313, 0.04220543056726456, 0.024131037294864655, -0.030570561066269875, -0.04686930775642395, 0.10294365137815475, -0.016010800376534462, 0.04289080947637558, -0.039594683796167374, 0.0438046008348465]"
3,1,"Beratung von Studierenden, insbesondere Betreuung bei der Absolvierung der päda-gogisch-praktischen Studien und der Erstellung von Qualifizierungsarbeiten",367.0,521.0,"[0.025065844878554344, 0.08334314823150635, -0.030707743018865585, 0.02014520764350891, -0.05506227910518646, -0.015294376760721207, -0.03594242408871651, 0.0458063930273056, -0.019109932705760002, -0.007956106215715408, -0.029495758935809135, 0.03867299109697342, 0.010056722909212112, 0.042701512575149536, 0.05172894150018692, 0.002806236268952489, 0.04004071652889252, -0.01757856458425522, 0.06836696714162827, -0.008026717230677605, -0.09341733157634735, -0.01844867132604122, 0.026512349024415016, -0.0017347373068332672, -0.02887122705578804, -0.0180886872112751, 0.06731995195150375, -0.04994926601648331, 0.08198282122612, -0.05560477823019028, -0.024953806772828102, -0.008684593252837658, 0.019239269196987152, 0.00718076853081584, -0.06990993767976761, 0.12927092611789703, -0.05351535230875015, 0.0561944954097271, 0.011709085665643215, -0.006792018190026283, -0.03811165690422058, -0.025879766792058945, 0.019187171012163162, 0.0450466088950634, 0.019884809851646423, -0.0670221820473671, -0.005560188554227352, -0.004226699937134981, -0.0900982990860939, -0.03171101585030556, -0.10453562438488007, -0.09453190863132477, 0.015145855955779552, -0.07922444492578506, -0.0032741085160523653, 0.009502673521637917, 0.09860565513372421, -0.0023425829131156206, -0.06979108601808548, 0.08357550948858261, -0.02893473394215107, 0.016203412786126137, -0.1072760671377182, 0.05451689288020134, -0.06853951513767242, -0.02091164141893387, 0.018670281395316124, 0.07583007961511612, 0.025484703481197357, 0.0417977049946785, -0.05445994809269905, -0.03276055306196213, -0.0019709544721990824, 0.04746269807219505, 0.04259134829044342, 0.06574532389640808, -0.025050586089491844, 0.005476372316479683, 0.07420365512371063, -0.0642651915550232, 0.111943818628788, 0.042322270572185516, 0.05802399292588234, 
-0.016324931755661964, 0.027701588347554207, 0.005022305063903332, -0.05374545231461525, 0.1404913067817688, 0.04549000412225723, -0.03409072011709213, 0.07409916818141937, 0.0034958492033183575, -0.01557255256921053, 0.03686399385333061, 0.018937580287456512, -0.008723372593522072, 0.015231595374643803, -0.004684306215494871, 0.010789153166115284, 0.09784442186355591, -0.05449307709932327, 0.023737149313092232, 0.03831886127591133, -0.02036367356777191, -0.05749914050102234, 0.04052126780152321, 0.06958045810461044, -0.05657657980918884, 0.04217233881354332, 0.03819175809621811, -0.048365361988544464, 0.006058884784579277, -0.08555391430854797, -0.035920046269893646, -0.03147830069065094, 0.07200383394956589, 0.060803502798080444, 0.018446099013090134, 0.019153155386447906, 0.09641177952289581, -0.01687597669661045, -0.02892250195145607, 0.10352888703346252, -0.08507221192121506, 0.02043105475604534, -0.054819945245981216, -0.03418419137597084, 0.0190238319337368, -0.0015690678264945745, -0.062053270637989044, 0.06254424154758453, 0.06673968583345413, -0.05348489433526993, 0.0557364858686924, 0.005871279630810022, -0.050270926207304, 0.03331592306494713, -0.032435640692710876, -0.002971226815134287, 0.016395071521401405, 0.05974414199590683, 0.01197096984833479, 0.0020064404234290123, 0.09528861194849014, -0.026717375963926315, 0.017553232610225677, -0.04337528347969055, 0.09933240711688995, 0.10763422399759293, -0.017323195934295654, 0.08354225754737854, 0.024897539988160133, -0.03202051296830177, -0.022601906210184097, -0.010327676311135292, -0.006391649600118399, 0.031726330518722534, -0.01951129361987114, 0.04666405916213989, -0.058918144553899765, -0.08510469645261765, 0.023132801055908203, 0.0232792180031538, 0.01648075506091118, 0.019658731296658516, -0.04726020619273186, 0.01927603967487812, -0.05901065096259117, -0.023986121639609337, 0.002033868106082082, 0.047894932329654694, -0.04421856999397278, 0.023886065930128098, 0.028447525575757027, 
0.046934355050325394, -0.032653432339429855, -0.021125292405486107, 0.07812506705522537, -0.0732739195227623, -0.0415327250957489, 0.06143476441502571, -0.029871413484215736, -0.018232107162475586, -0.008183781988918781, 0.010151686146855354, 0.007258541416376829, 0.000768075929954648, -0.07056056708097458, 0.01680670492351055, 0.049449510872364044, -0.09478326886892319, -0.03103303723037243, -0.007848812267184258, -0.07883929461240768, -0.035987429320812225, -0.011210246942937374, 0.063169926404953, -0.1537412852048874, -0.15125276148319244, 0.08191133290529251, -0.07650630921125412, -0.013869218528270721, -0.05037218704819679, -0.024739740416407585, 0.022182494401931763, 0.025242310017347336, 0.09436050802469254, -0.046194784343242645, 0.12823531031608582, -0.0028119352646172047, -0.022738954052329063, -0.02255367673933506, 0.05313638597726822, -0.011301840655505657, 0.03347454220056534, -0.008758685551583767, 0.0112101836130023, 0.07528204470872879, -0.011167585849761963, 0.025122445076704025, -0.03236934170126915, -0.005092309322208166, 0.06121617183089256, -0.08440563082695007, -0.06593804061412811, -0.026124263182282448, -0.044142432510852814, 0.029056845232844353, 0.08984369784593582, 0.003947832155972719, 0.0009301936952397227, -0.09135399758815765, 0.038797855377197266, 0.010536317713558674, -0.05738655477762222, -0.07630568742752075, 0.07524865120649338, 0.012925091199576855, -0.11818721145391464, -0.05346006155014038, -0.06138421967625618, 0.004726809915155172, -0.021465566009283066, -0.003117206273600459, -0.026741186156868935, 0.07023736089468002, 0.00733037618920207, -0.06636207550764084, 0.008451423607766628, -0.001532293390482664, 0.016109289601445198, -0.16234710812568665, -0.05434257164597511, 0.013045050203800201, 0.06806681305170059, 0.013541581109166145, -0.08453909307718277, -0.01119064912199974, -0.07459874451160431, 0.06664387881755829, 0.02894570492208004, 0.01718994788825512, -0.03429103642702103, 0.11787618696689606, 0.04357167333364487, 
-0.02592570334672928, -0.04010772705078125, -0.09751926362514496, 0.022024963051080704, 0.0114567456766963, -0.05899398401379585, -0.08190350979566574, 0.0007053854060359299, -0.019445421174168587, 0.02103421464562416, -0.025677766650915146, -0.0336071141064167, -0.04731827974319458, 0.08217908442020416, -0.00023185966711025685, 0.018515432253479958, -0.030672477558255196, -0.02111215703189373, 0.0068306876346468925, 0.006735877599567175, 0.0027679556515067816, 0.047738585621118546, -0.05087065324187279, -0.0011250098468735814, -0.011696935631334782, 0.00025119876954704523, 0.06235724687576294, -0.04405303671956062, -0.03224613144993782, 0.014175795949995518, -0.018905390053987503, -0.06590577214956284, -0.027485618367791176, 0.0036075341049581766, -0.007564548868685961, -0.009026953019201756, 0.007206310518085957, -0.03346299007534981, -0.02367323264479637, 0.017664730548858643, -0.08143961429595947, -0.0046566505916416645, 0.041659753769636154, -7.557859498774633e-05, 0.02474486641585827, 0.00505383824929595, -0.07736693322658539, 0.04499799758195877, -0.05911337956786156, -0.008226078003644943, -0.03310943394899368, 0.03447664901614189, -0.06665834039449692, 0.07379776984453201, -0.07776633650064468, -0.008735842071473598, -0.016080481931567192, -0.004304205067455769, 0.02862546406686306, -0.04087669774889946, 0.0496218204498291, -0.09187968820333481, -0.003959503024816513, 0.004680586978793144, 0.052023112773895264, -0.08238259702920914, -0.008728452026844025, -0.00678397947922349, 0.03660915046930313, 0.05253977328538895, 0.04632210358977318, 0.0532369464635849, 0.07519590109586716, 0.020439831539988518, 0.008043673820793629, 0.07986438274383545, -0.0018824671860784292, -0.041997943073511124, 0.019531842321157455, -0.04380191117525101, -0.02648239955306053, 0.014965553767979145, 0.060070235282182693, -0.07541466504335403, -0.02041848935186863, -0.07696752995252609, 0.06609726697206497, 0.03558531403541565, -0.08661433309316635, 0.0888194739818573, 
-0.024816563352942467, 0.01018509641289711, 0.046858664602041245, 0.05739200860261917, 0.040995121002197266, -0.0663604810833931, -0.011033748276531696, 0.07208810746669769, 0.04425719752907753, 0.02407854050397873, 0.037374481558799744, -0.08430131524801254, 0.04258349910378456, -0.04412326589226723, 0.07083349674940109, 0.018296193331480026, -0.005756919272243977, -0.0022852111142128706, -0.06902579963207245, 0.06297938525676727, 0.03476538136601448, 0.04984345659613609, 0.0012665798421949148, -0.08704320341348648, 0.05209099128842354, 0.040047865360975266, 0.04673423990607262, 0.011899447999894619, 0.06604034453630447]"
4,1,"Mitarbeit im Zentrum für Minderheitenschulwesen, Mehrsprachigkeit und Inklusion",524.0,603.0,"[0.09072640538215637, 0.05437076464295387, -0.034094952046871185, 0.007253492251038551, -0.034077104181051254, 0.02128671482205391, -0.015036596916615963, -0.1023382917046547, -0.015941748395562172, 0.0375838465988636, -0.0072065843269228935, -0.039128661155700684, 0.031466737389564514, -0.01744571141898632, 0.09334982186555862, 0.08835766464471817, 0.008920733816921711, 0.04380981624126434, -0.003460764419287443, -0.04820200800895691, -0.08840373903512955, -0.07428213953971863, -0.016913654282689095, -0.014568088576197624, 0.06347955763339996, -0.023403163999319077, 0.07308560609817505, -0.011247093789279461, 0.05574551597237587, -0.05926123633980751, 0.07476767897605896, -0.01442954782396555, 0.10528726875782013, 0.05222684144973755, -0.09009901434183121, 0.06259007751941681, 0.06704307347536087, 0.04727441072463989, -0.014429586939513683, -0.027781426906585693, -0.006535330321639776, -0.029164213687181473, 0.04347213730216026, 0.052330534905195236, -0.0002466832520440221, -0.01796000450849533, -0.11127596348524094, -0.006760089658200741, -0.07479553669691086, -0.0986766666173935, -0.008099252358078957, -0.022354882210493088, -0.010642977431416512, -0.011125153861939907, -0.01591949723660946, 0.024692688137292862, 0.004153016954660416, 0.020417815074324608, 0.022614501416683197, 0.059867944568395615, -0.002777502406388521, 0.014840304851531982, -0.05326820909976959, 0.08844057470560074, -0.03685217350721359, -0.04256097227334976, 0.04886310175061226, 0.03395989164710045, -0.033366795629262924, -0.06360920518636703, 0.027066396549344063, 0.02138255164027214, -0.0018702795496210456, 0.04691118746995926, 0.0579538457095623, 0.05858033150434494, 0.007366383448243141, 0.0440916083753109, 0.03055906854569912, -0.04494057595729828, 0.03284205123782158, 0.07430122792720795, 0.06676912307739258, -0.008642596192657948, 0.04080353304743767, -0.02434062585234642, 
-0.047123413532972336, -0.0034594316966831684, 0.015621693804860115, -0.020550012588500977, -0.08238454163074493, 0.046319808810949326, 0.07664595544338226, -0.020653018727898598, 0.04716106131672859, -0.0581778958439827, -0.009924951009452343, -0.041508179157972336, 0.018902335315942764, 0.10532650351524353, -0.02421959489583969, 0.004748123697936535, 0.0557200126349926, -0.009245430119335651, -0.08110563457012177, 0.02690960466861725, 0.07448101788759232, -0.017952093854546547, -0.029331665486097336, 0.021590324118733406, -0.05329267308115959, -0.04296166077256203, -0.07438566535711288, 0.024496957659721375, -0.029612237587571144, -0.00027080715517513454, 0.08681810647249222, -0.02211342565715313, 0.021565986797213554, 0.05600661784410477, -0.0996406078338623, 0.07266078144311905, -0.03972902521491051, -0.08017429709434509, 0.0677461251616478, -0.010372756980359554, 0.021210387349128723, 0.018858125433325768, 0.009951292537152767, 0.0275823213160038, -0.04980645701289177, 0.06716509163379669, 0.024204200133681297, 0.06271519511938095, 0.057149361819028854, -0.061499543488025665, -0.01874471642076969, -0.02282790094614029, 0.025632984936237335, -0.003779298858717084, 0.06963823735713959, 0.05372496321797371, -0.016754725947976112, 0.05043651536107063, 0.008829483762383461, -0.015787264332175255, -0.08470199257135391, 0.07034894824028015, 0.048734817653894424, 0.039675042033195496, 0.023990007117390633, 0.07022061198949814, -0.047735050320625305, 0.0037557194009423256, -0.03135794773697853, -0.005909515079110861, 0.1416018158197403, -0.0023032850585877895, 0.021290089935064316, 0.03107856586575508, -0.021300379186868668, 8.470646207570098e-06, 0.04132184386253357, -0.013576461933553219, 0.005777429789304733, -0.018831392750144005, -0.002990021603181958, -0.019031204283237457, -0.008419342339038849, -0.049465108662843704, 0.02223903313279152, 0.006700742058455944, 0.11230996251106262, 0.0443967767059803, 0.009249724447727203, -0.08011898398399353, 
-0.008012844249606133, 0.13506446778774261, -0.030459629371762276, -0.06291542947292328, -0.02897367998957634, -0.03986864164471626, -0.011578009463846684, -0.041825875639915466, -0.012703537940979004, 0.06606031209230423, 0.06182306259870529, -0.06534183770418167, 0.013399861752986908, -0.001242614584043622, -0.048492975533008575, 0.023473700508475304, 0.06279762834310532, -0.07382060587406158, -0.06140836328268051, 0.017975568771362305, 0.026842953637242317, -0.2070072591304779, -0.0023835671599954367, 0.03495865315198898, -0.08742481470108032, 0.06002727895975113, -0.09310834109783173, 0.034626904875040054, 0.02058139070868492, -0.02778572216629982, 0.1141572967171669, 0.009233933873474598, 0.03155636787414551, 0.07534947246313095, 0.003920416813343763, -0.04471937194466591, -0.05921618267893791, -0.031224187463521957, -0.002823868300765753, -0.001801537349820137, 0.01731332391500473, 0.09355054795742035, -0.0258422140032053, 0.043531108647584915, -0.05285406857728958, -0.03272064030170441, 0.02106986567378044, -0.06953305006027222, -0.03084987960755825, -0.0010703668231144547, -0.05644519627094269, 0.00986156240105629, 0.01597099006175995, 0.055860307067632675, 0.0030241874046623707, -0.06437171250581741, 0.049008410423994064, 0.09226864576339722, -0.008697078563272953, -0.0964953750371933, 0.15995220839977264, -0.009837348945438862, -0.14420032501220703, 0.007117702160030603, 0.024819206446409225, 0.08710440993309021, 0.01737465336918831, 0.004091640003025532, -0.025002310052514076, -0.00723612867295742, -0.0055801295675337315, 0.04320484399795532, -0.06444932520389557, 0.03272964805364609, 0.014293975196778774, -0.1402660310268402, -0.0355449877679348, -0.03456685692071915, 0.042782265692949295, -0.05158279836177826, -0.07103665173053741, -0.05232413858175278, 0.020032288506627083, -0.04597029834985733, -0.06132573261857033, -0.02847585640847683, -0.08883693069219589, 0.10856068879365921, 0.0310528427362442, -0.004627462476491928, -0.07554849982261658, 
-0.015637947246432304, 0.02817779779434204, 0.06394975632429123, -0.03410211205482483, 0.03235388174653053, -0.08629975467920303, -0.039184119552373886, -0.03678091615438461, 0.006179116200655699, 0.009992427192628384, -0.0633288249373436, 0.08435998111963272, 0.02552289515733719, 0.011705286800861359, 0.00026614818489179015, -0.04438457265496254, 0.011554607190191746, 0.00784205924719572, 0.05967371538281441, -0.01786377653479576, 0.0062467134557664394, 0.06264201551675797, 0.07177279889583588, 0.014462173916399479, -0.005425712559372187, 0.019866621121764183, -0.0036732666194438934, 0.02593991905450821, 0.016104694455862045, -0.05388273298740387, -0.04765523225069046, -0.0621272549033165, 0.046918854117393494, 0.057216744869947433, 0.05605144426226616, -0.048892393708229065, -0.024404844269156456, -0.04588034003973007, -0.08711011707782745, 0.007061363663524389, -0.03837429732084274, 0.012657762505114079, 0.03552339971065521, 0.017172543331980705, -0.050802938640117645, 0.0723891630768776, -0.04018077999353409, -0.06082099303603172, -0.012529764324426651, -0.01801363006234169, -0.03903497755527496, 0.0762910321354866, -0.09792489558458328, 0.04155239090323448, -0.04482341185212135, -0.1034618616104126, -0.0019009177340194583, 0.0011305335210636258, -0.0014587320620194077, -0.028242940083146095, -0.0723799541592598, 0.0007046940736472607, 0.14205272495746613, -0.06120891496539116, -0.044515449553728104, -0.05703006312251091, -0.033534593880176544, 0.023598166182637215, 0.013632141053676605, -0.002243900904431939, 0.0064263492822647095, 0.032501861453056335, 0.007768957410007715, 0.029885783791542053, -0.0060872770845890045, -0.009924065321683884, 0.014952708035707474, -0.048981864005327225, -0.07219178229570389, -0.06738822162151337, -0.028052760288119316, -0.07875845581293106, -0.03597993403673172, 0.0005317198229022324, 0.034351617097854614, -0.02513025514781475, -0.06452243775129318, -0.017874646931886673, 0.025228876620531082, -0.02275875210762024, 
0.03708307445049286, 0.07623682916164398, -0.026261433959007263, -0.014846713282167912, 0.006576885469257832, 0.02089112251996994, 0.0017304752254858613, 0.032937049865722656, 0.016990669071674347, -0.08073487877845764, 0.05322425067424774, -0.0630451962351799, -0.002386352512985468, -0.04442332312464714, 0.014628070406615734, -0.004182504490017891, 0.037654440850019455, 0.08466149866580963, -0.04443548247218132, 0.03969821333885193, 0.034204497933387756, -0.03900252282619476, 0.023520581424236298, 0.05389050394296646, 0.04856599122285843, -0.039504531770944595, 0.04686565324664116]"


### Phrase Extraction

In [27]:
#extract the phrases
#every entry appended to `phrases` is a tuple:
#(job id, phrase_surface, phrase_lemma, score, pos_signature, span start, span end)
phrases = []

#iterate over the two needed columns by value instead of df.loc[i, ...]:
#.loc is label-based, so a positional counter is only correct while the index is exactly 0..n-1
#(which is no longer the case as soon as rows are filtered or the index is changed upstream)
for text, job_id_value in zip(df["text_clean"], df[id_col]):

    phs = extract_phrases(
        text,
        max_candidates = C.KEYBERT_MAX_CANDIDATES,
        score_cutoff = C.KEYBERT_SCORE_CUTOFF
    )

    #save each phrase together with its job id and its span into a tuple
    for item in phs:
        surface = item["phrase_surface"]

        #we allow fuzzy matching here because the surface is normalized (stopwords/lemma/spacing)
        start, end = find_span_in_text(text, surface, allow_fuzzy=True, min_tokens_found=1)

        phrases.append((
            job_id_value,
            surface,
            item["phrase_lemma"],
            item["score"],
            item["pos_signature"],
            start,
            end
        ))

print("Total phrases extracted:", len(phrases))

Total phrases extracted: 7668


*Below are some statistics describing the extracted phrases.*

In [29]:
#per POS signature we keep a running phrase count and the running sum of the scores
pos_info = {}

for _job_id, _surface, _lemma, phrase_score, signature, _span_start, _span_end in phrases:
    bucket = pos_info.setdefault(signature, {"count": 0, "sum_score": 0.0})
    bucket["count"] += 1
    bucket["sum_score"] += float(phrase_score)

#one row per POS signature: [signature, number of phrases, average score]
pos_rows = [
    [signature, bucket["count"], bucket["sum_score"] / bucket["count"]]
    for signature, bucket in pos_info.items()
]

pos_stats = pd.DataFrame(pos_rows, columns=["POS", "n_phrases", "avg. score"])

display(pos_stats)

Unnamed: 0,POS,n_phrases,avg. score
0,ADJ NOUN,2391,0.480627
1,VERB NOUN,770,0.474442
2,NOUN VERB,1926,0.482492
3,NOUN NOUN,2246,0.473721
4,NOUN ADJ,335,0.463773


In [31]:
#count how many phrases were extracted for each job id
#note: only jobs that appear in `phrases` get an entry, so jobs without any extracted phrase
#are not part of the statistics below
phrase_counts = {}

for item in phrases:
    job_id_value = item[0]
    phrase_counts[job_id_value] = phrase_counts.get(job_id_value, 0) + 1

counts = list(phrase_counts.values())

#the fallbacks keep this cell runnable when no phrase was extracted at all
#(min()/max() of an empty list and the division by len(counts) would raise otherwise)
jobs_with_phrases = len(phrase_counts)
min_phr_per_job = min(counts, default=0)
max_phr_per_job = max(counts, default=0)
avg_phr_per_job = round(sum(counts)/len(counts),2) if counts else 0.0

phr_job_summary = pd.DataFrame({
    "": [
        "jobs_with_phrases",
        "min_phrases_per_job",
        "avg_phrases_per_job",
        "max_phrases_per_job",
    ],
    "value": [
        jobs_with_phrases,
        min_phr_per_job,
        avg_phr_per_job,
        max_phr_per_job,
    ],
})

print("Phrase count per job (distribution summary)")
display(phr_job_summary)


Phrase count per job (distribution summary)


Unnamed: 0,Unnamed: 1,value
0,jobs_with_phrases,371.0
1,min_phrases_per_job,1.0
2,avg_phrases_per_job,20.67
3,max_phrases_per_job,72.0


In [33]:
#collect the score of every extracted phrase (4th field of each phrase tuple)
score_values = [float(item[3]) for item in phrases]

if score_values:
    min_score = min(score_values)
    max_score = max(score_values)
    avg_score = sum(score_values) / len(score_values)
else:
    #no phrases extracted: report NaN instead of failing on min()/max() of an empty list
    #and on the division by zero
    min_score = max_score = avg_score = float("nan")

score_summary = pd.DataFrame({
    "": ["min_score", "avg_score", "max_score"],
    "value": [min_score, avg_score, max_score],
})

print("KeyBERT score statistics (all extracted phrases)")
display(score_summary)

KeyBERT score statistics (all extracted phrases)


Unnamed: 0,Unnamed: 1,value
0,min_score,0.3
1,avg_score,0.477715
2,max_score,0.8838


### Embed Phrases and Load to SQL
As with the sentence units, the phrases are embedded in batches; the resulting table is then written to the SQLite database.

In [36]:
#column layout of the job_phrases table, defined once so that the filled and the empty result share it
phrase_columns = [
    id_col,
    "phrase_surface",
    "phrase_lemma",
    "KeyBert score",
    "pos_signature",
    "phrase_start",
    "phrase_end",
    "embedding_json",
]

#a batch size of zero or below would never advance through the phrase list
batch_size = C.EMBED_BATCH_SIZE
if batch_size <= 0:
    raise ValueError("C.EMBED_BATCH_SIZE must be positive, got " + repr(batch_size))

parts = []

#same logic as for the unit embedding: embed one slice of the phrase list at a time
for batch_start in range(0, len(phrases), batch_size):
    batch = phrases[batch_start:batch_start + batch_size]

    #turn the batch of phrase tuples into one list per field (the batch is never empty here)
    job_ids, surfaces, lemmas, kb_scores, pos_sigs, phrase_starts, phrase_ends = (
        list(field) for field in zip(*batch)
    )

    #we will embed the surface text because transformers are usually not trained on lemmatized versions, but on natural language
    vectors = embed_texts(surfaces)
    embedding_json_list = [as_json(v) for v in vectors]

    #field lists in the same order as phrase_columns
    fields = [
        job_ids,
        surfaces,
        lemmas,
        kb_scores,
        pos_sigs,
        phrase_starts,
        phrase_ends,
        embedding_json_list,
    ]
    parts.append(pd.DataFrame(dict(zip(phrase_columns, fields))))

if parts:
    df_phrases = pd.concat(parts, ignore_index=True)
else:
    #in case no phrases extracted (just in case)
    df_phrases = pd.DataFrame(columns=phrase_columns)


df_to_sqlite(df_phrases, sqlite_out, "job_phrases")
print("Saved", len(df_phrases))
print("Preview of phrase embeddings:")
display(df_phrases.head(5))


Saved 7668
Preview of phrase embeddings:


Unnamed: 0,job_id,phrase_surface,phrase_lemma,KeyBert score,pos_signature,phrase_start,phrase_end,embedding_json
0,1,pädagogischen hochschule,pädagogisch hochschule,0.7235,ADJ NOUN,83,107,"[0.08886658400297165, 0.04389321058988571, 0.004177523776888847, 0.009140496142208576, -0.024998676031827927, -0.0493110790848732, -0.07320988923311234, -0.005590064916759729, 0.004249081015586853, 0.02021803706884384, 0.010085003450512886, 0.005352774169296026, -0.007898133248090744, 0.019722217693924904, 0.006570129189640284, 0.025265365839004517, 0.03993462771177292, 0.05247011035680771, 0.06347435712814331, -0.014021459966897964, -0.011608550325036049, -0.004045360721647739, 0.03633054345846176, -0.008103524334728718, 0.009458040818572044, -0.007773444522172213, 0.01670166477560997, -0.06199166178703308, 0.020521046593785286, -0.09302502125501633, -0.004385611042380333, -0.0640878975391388, 0.1117168664932251, 0.043662093579769135, -0.06906013190746307, 0.10294963419437408, 0.029044950380921364, 0.03927764296531677, 0.022929439321160316, 0.002892559627071023, 0.0014327246462926269, -0.015404749661684036, 0.043958451598882675, 0.059603262692689896, 0.01976848393678665, -0.0496046356856823, -0.05371393263339996, -0.023280804976820946, -0.02813876047730446, -0.0508967749774456, -0.04311163350939751, -0.05935559421777725, -0.027102092280983925, -0.019110308960080147, -0.02093793824315071, 0.059502702206373215, 0.07215677946805954, 0.025003444403409958, -0.036925606429576874, 0.0703204870223999, -0.08660779893398285, 0.08249450474977493, -0.09051781892776489, 0.020047621801495552, -0.014861294068396091, -0.018708722665905952, 0.025993220508098602, 0.09622844308614731, -0.033125534653663635, 0.025416698306798935, -0.019841881468892097, -0.02572237141430378, 0.02104201167821884, 0.08860278129577637, 0.10325151681900024, 0.05526812747120857, -0.007918402552604675, 0.003223501145839691, 0.07824474573135376, -0.036692067980766296, 0.07825774699449539, -0.034966979175806046, 0.04154003784060478, -0.018108967691659927, 0.05008259415626526, -0.015415730886161327, -0.05544942244887352, 
0.03371095284819603, 0.03927621245384216, -0.0564696229994297, 0.06911662220954895, -0.09946059435606003, -0.013548433780670166, -0.016687363386154175, 0.03466803580522537, -0.009639467112720013, -0.008068891242146492, -0.0822516605257988, 0.02553650178015232, 0.2487506866455078, -0.06943530589342117, 0.00032247943454422057, 0.024447690695524216, -0.052896127104759216, -0.03899287059903145, -0.0016642088303342462, 0.03312976658344269, -0.06096198037266731, -0.006542819086462259, 0.009690842591226101, 0.009690293110907078, -0.046739693731069565, -0.025907939299941063, 0.04010085016489029, 0.01815011166036129, 0.02019542083144188, 0.038363758474588394, -0.0035064909607172012, 0.050827063620090485, 0.05459156259894371, -0.03247755393385887, 0.007961188443005085, 0.028790690004825592, -0.10968540608882904, -0.003701247740536928, -0.05693183094263077, -0.01080945786088705, 0.06606259942054749, 0.003458367194980383, 0.0012168538523837924, 0.026236267760396004, 0.032925862818956375, -0.016489684581756592, 0.04059628024697304, 0.0171440951526165, -0.02167695201933384, 0.01730439066886902, 0.019123578444123268, 0.043695852160453796, -0.008981560356914997, -0.008198041468858719, 0.08555855602025986, 0.017099102959036827, 0.026993226259946823, -0.07639012485742569, 0.010646662674844265, 0.0024693352170288563, 0.04580925032496452, 0.04561001434922218, 0.01936582289636135, -0.004633407108485699, -0.04492301866412163, -0.028721673414111137, -0.026048503816127777, -0.02227824553847313, -0.004211827181279659, 0.07424670457839966, 0.002377767115831375, 0.08786282688379288, 0.001895242603495717, -0.11180757731199265, 0.04251182824373245, 0.08192224055528641, 0.001772110816091299, 0.07433883845806122, -0.024222513660788536, 0.052102331072092056, -0.062335237860679626, -0.02098982408642769, 0.0044898404739797115, 0.11562443524599075, 0.008887888863682747, 0.06102479249238968, 0.0867815613746643, 0.04787823185324669, -0.040627118200063705, -0.047747086733579636, 0.046747349202632904, 
-0.027797836810350418, -0.061953235417604446, -0.014655104838311672, -0.05402836203575134, 0.02671177312731743, -0.009065412916243076, 0.04100792109966278, 0.05869594216346741, 0.01567234843969345, -0.06898593157529831, 0.021781694144010544, 0.09244220703840256, -0.06790261715650558, 0.03252942115068436, -0.04687122628092766, -0.13867239654064178, -0.08525916188955307, -0.0007245547021739185, 0.13514308631420135, -0.1339460164308548, -0.040355946868658066, 0.018712621182203293, -0.07262509316205978, -0.029138918966054916, -0.025316176936030388, -0.01389290951192379, -0.017323486506938934, -0.03892070800065994, 0.07737334817647934, -0.003710737219080329, 0.08578863739967346, 0.01557034533470869, -0.013198627158999443, -0.014700750820338726, 0.0445454977452755, -0.010287335142493248, -0.02771768905222416, 0.013618707656860352, 0.029014186933636665, 0.04059566557407379, -0.06483276188373566, 0.015123086981475353, -0.01586727984249592, 0.014205138199031353, 0.009036018513143063, -0.10204578936100006, 0.03354828804731369, 0.001679093111306429, -0.0728565901517868, 0.09199235588312149, 0.045978303998708725, 0.007503332104533911, 0.0039332564920187, -0.016648445278406143, 0.023504815995693207, 0.02686258777976036, -0.0556233711540699, -0.046894289553165436, 0.07963494956493378, 0.033117059618234634, -0.06824000924825668, -0.06862614303827286, -0.018262041732668877, -0.0066177016124129295, -0.05275586619973183, 0.020825956016778946, 0.025877516716718674, -0.002750436309725046, -0.05251128971576691, 0.052066195756196976, 0.04330794885754585, -0.01611967384815216, -0.07948920130729675, -0.05314834043383598, -0.07830043137073517, -0.01772821694612503, 0.03073103353381157, 0.02271948754787445, 0.018395761027932167, 0.013317039236426353, -0.03532426059246063, -0.01917501538991928, 0.04091418534517288, -0.060903001576662064, -0.06405656784772873, 0.06297214329242706, 0.03397928550839424, -0.08869841694831848, -0.02249537594616413, -0.016807667911052704, -0.005755979102104902, 
0.05861669033765793, -0.06550624966621399, 0.015062117017805576, -0.010138369165360928, 0.0018991061951965094, -0.08488164842128754, -0.016263315454125404, -0.025543952360749245, -0.08961132168769836, 0.07179040461778641, -0.03486661985516548, -0.010984097607433796, -0.03196669742465019, -0.009510006755590439, 0.04764510691165924, -0.002807531040161848, -0.031057259067893028, 0.020156254991889, -0.000958435470238328, 0.03465761989355087, 0.04004582390189171, 0.019389383494853973, 0.04467185586690903, -0.119074746966362, 0.047127865254879, 0.037253767251968384, 0.02196703851222992, 0.01761716604232788, -0.05216206982731819, -0.06627332419157028, 0.07088242471218109, 0.047605209052562714, 0.05021882802248001, -0.05976787209510803, -0.013836820609867573, 0.00504270801320672, -0.05843620002269745, -0.07276444882154465, -0.006214868742972612, -0.052176155149936676, 0.027937792241573334, 0.0021066300105303526, -0.05565160512924194, 0.06730850040912628, -0.0485495999455452, 0.0028694469947367907, -0.010822814889252186, -0.005951135419309139, -0.1197265237569809, 0.03278015926480293, -0.12040872871875763, -0.043355491012334824, -0.007074709050357342, -0.062109481543302536, 0.0804600715637207, -0.022525573149323463, -0.005309154745191336, -0.005717085674405098, -0.0069636572152376175, 0.04304972290992737, -0.010834415443241596, -0.08663048595190048, -0.010217051021754742, -0.06640327721834183, -0.015487278811633587, 0.10414568334817886, 0.026701590046286583, 0.004394921008497477, 0.021973149850964546, 0.03589517995715141, 0.014042814262211323, 0.05151969939470291, 0.02051812782883644, -0.026372155174613, 0.02130242809653282, -0.07777830213308334, -0.030854418873786926, -0.01904470846056938, 0.007160894572734833, -0.05591142922639847, 0.02964373305439949, -0.046803783625364304, 0.0007659680559299886, -0.03914957866072655, -0.10468760877847672, 0.06198909506201744, 0.04895719140768051, 0.010683487169444561, 0.011444692499935627, 0.08962144702672958, -0.0397341288626194, 
-0.03602517768740654, -0.06478030979633331, 0.03806443139910698, 0.027116000652313232, 0.04041929915547371, 0.05936369672417641, -0.07406376302242279, 0.09313775599002838, -0.005263426806777716, 0.04648634418845177, -0.014091141521930695, 0.045223671942949295, 0.0010832638945430517, -0.14776553213596344, 0.07705243676900864, 0.04352329671382904, 0.03727880120277405, -0.05652656778693199, -0.12162374705076218, 0.02683151885867119, 0.08840420842170715, -0.030618080869317055, -0.00917731411755085, 0.03616143390536308]"
1,1,bereichen lehre,bereich lehre,0.7183,VERB NOUN,228,246,"[0.06694944947957993, -0.010488499887287617, -0.0068045188672840595, 0.03013945184648037, -0.017793135717511177, 0.00671760831028223, -0.02920297533273697, -0.007813587784767151, -0.0014119630213826895, 0.022306472063064575, -0.009351099841296673, 0.06241345405578613, -0.01599767990410328, 0.05353011190891266, -0.03535172715783119, 0.03828515484929085, 0.010768609121441841, 0.04853147640824318, 0.025090912356972694, -0.04531581327319145, -0.041020214557647705, 0.03619374334812164, 0.02712087519466877, -0.02644937112927437, -0.016203828155994415, -0.022358160465955734, 0.007860764861106873, -0.0605543777346611, 0.04741206020116806, -0.09072019904851913, -0.04150767996907234, -0.10670237988233566, 0.10325223952531815, 0.03461853042244911, -0.07269406318664551, 0.09763777256011963, 0.012576302513480186, 0.11405922472476959, 0.011264177039265633, -0.005869379732757807, 0.017488954588770866, -0.0008500737603753805, 0.02487780526280403, 0.06885672360658646, -0.007778307422995567, -0.06618016958236694, -0.0641251653432846, 0.0027364129200577736, -0.024190733209252357, -0.057822100818157196, -0.0611296109855175, -0.05140291899442673, -0.02127901278436184, 0.009573673829436302, -0.0448315404355526, 0.002237096894532442, 0.07361894845962524, 0.041353534907102585, -0.018806092441082, 0.09526606649160385, -0.08047086745500565, 0.035723231732845306, -0.08497606962919235, 0.04936792701482773, -0.025490760803222656, 0.018196487799286842, 0.003153992583975196, 0.0377269983291626, -0.018893172964453697, 0.011975356377661228, -0.001864921418018639, -0.014372356235980988, -0.0030627588275820017, 0.06515280157327652, 0.035698506981134415, -0.010312940925359726, -0.0032860415522009134, -0.0018101067980751395, 0.08321654051542282, -0.043256063014268875, 0.023636799305677414, -0.0029131551273167133, 0.056877754628658295, 0.023404069244861603, -0.012949036434292793, 0.0023779654875397682, -0.053603533655405045, 
0.05500512570142746, 0.018290698528289795, -0.04398122429847717, 0.08175364136695862, -0.06952936947345734, 0.03214120864868164, -0.018541814759373665, 0.036216143518686295, -0.02169312909245491, 0.029459349811077118, -0.04616704210639, -0.03676418960094452, 0.27668994665145874, -0.07508493959903717, -0.02332473173737526, 0.05115782842040062, -0.037501297891139984, -0.04623858258128166, 0.02535938285291195, -0.0011743856593966484, -0.0714726597070694, -0.0445752888917923, -0.026673460379242897, 0.00878053717315197, -0.03683558106422424, -0.053838279098272324, 0.03873222693800926, 0.05364169552922249, -0.0020463159307837486, 0.04931384697556496, 0.01898667775094509, -0.014403492212295532, 0.04757045954465866, -0.0052812728099524975, 0.02603308856487274, 0.007467329502105713, -0.0887780487537384, 0.027287492528557777, -0.1334933489561081, -0.01364968903362751, 0.04693001136183739, 0.03325715288519859, 0.027613861486315727, 0.004372209310531616, 0.06698673963546753, -0.011122593656182289, 0.056960515677928925, 0.011187938041985035, -0.000781387323513627, 0.01791497692465782, 0.03331027552485466, 0.025009848177433014, -0.020221369341015816, -0.014501865021884441, 0.05012228712439537, -0.07630865275859833, 0.020678559318184853, -0.002948144916445017, -0.03546653687953949, 0.015048959292471409, 0.04543237015604973, 0.029125045984983444, 0.05426549166440964, -0.014265630394220352, -0.027037134394049644, -0.027529099956154823, -0.02185605838894844, -0.0025568497367203236, 0.008366354741156101, 0.05389949679374695, -0.027366308495402336, 0.07248716801404953, -0.03847713768482208, -0.07740655541419983, 0.028262818232178688, 0.026846129447221756, -0.052885472774505615, 0.04420769214630127, -0.012825756333768368, 0.06946097314357758, -0.07438217103481293, 0.003243923420086503, -0.022229788824915886, 0.08736011385917664, -0.006983515340834856, 0.05580342188477516, 0.07702810317277908, 0.027393938973546028, -0.03278990462422371, -0.038897112011909485, 0.06463967263698578, 
0.014711616560816765, -0.004880896769464016, 0.04746362939476967, -0.015572011470794678, 0.05153078958392143, -0.0342707484960556, 0.048399195075035095, 0.09576751291751862, -0.015585147775709629, -0.02466200292110443, 0.015970060601830482, 0.06195979565382004, -0.018990298733115196, 0.047079138457775116, -0.050130609422922134, -0.1585555523633957, -0.09350284934043884, -0.04422163963317871, 0.09100773930549622, -0.11247603595256805, -0.06845942884683609, 0.06532272696495056, -0.0871632993221283, -0.001597230089828372, -0.02384728193283081, -0.03983842954039574, -0.019020672887563705, -0.0784122496843338, 0.02054436504840851, 0.025743594393134117, 0.03056809864938259, 0.046665437519550323, 0.015622622333467007, 0.0242482740432024, 0.03756486251950264, -0.041756611317396164, -0.02242458239197731, 0.06234574690461159, 0.059480126947164536, 0.09616103768348694, -0.008014230988919735, 0.05284048989415169, -0.027379339560866356, -0.026804352179169655, 0.04310497269034386, -0.11425337195396423, -0.01662486605346203, -0.0145493745803833, -0.0689263865351677, 0.09120269864797592, 0.029106786474585533, -0.011049006134271622, 0.004312373697757721, -0.03830898553133011, 0.031487442553043365, -0.04938960447907448, -0.08755600452423096, -0.09613122791051865, 0.05145184323191643, 0.028923705220222473, -0.0850331038236618, -0.006794235669076443, -0.05246295407414436, -0.0037996137980371714, -0.017453016713261604, 0.03300710767507553, 0.022874416783452034, 0.03139341622591019, -0.03444148972630501, 0.03566000610589981, 0.022368542850017548, -0.02721402794122696, -0.02124716341495514, -0.018018048256635666, -0.09869227558374405, -0.0309238750487566, 0.013587522320449352, -0.024757809937000275, 0.05451402813196182, -0.005846146959811449, -0.07075397670269012, 0.011875750496983528, 0.043650753796100616, -0.020480602979660034, -0.018253283575177193, 0.11565522849559784, 0.030533332377672195, -0.13322125375270844, -0.06722217053174973, -0.028534453362226486, -0.05960434302687645, 
0.012072774581611156, -0.030052589252591133, -0.027820345014333725, 0.021461013704538345, 0.023301919922232628, -0.07171861827373505, -0.03065916709601879, -0.03396570309996605, -0.12059129029512405, 0.06077254191040993, -0.03761109337210655, 0.03714260458946228, -0.07579927146434784, 0.04127167537808418, 0.001888952450826764, -0.004907168447971344, -0.048837579786777496, 0.023158911615610123, -0.037641219794750214, -0.008586830459535122, 0.05790529027581215, 0.03073178045451641, 0.10286928713321686, -0.0797405019402504, 0.018839679658412933, 0.042256031185388565, 0.03395635634660721, 0.0023408811539411545, -0.0062070260755717754, -0.04764106869697571, 0.10678249597549438, 0.018483024090528488, -0.04975130409002304, -0.09807836264371872, -0.04373373091220856, 0.005784857552498579, -0.0622028149664402, 0.014048661105334759, -0.005434119142591953, -0.04574497044086456, 0.034560635685920715, 0.007041418459266424, -0.04840464144945145, 0.049151912331581116, -0.01463485136628151, 0.01620737463235855, -0.008862129412591457, 0.03187558799982071, -0.09809505194425583, 0.04472862556576729, -0.1066879853606224, -0.0177885964512825, -0.015116846188902855, -0.03323640301823616, -0.015188234858214855, 0.049424268305301666, -0.0008849463192746043, -0.04088450223207474, 0.01886298693716526, 0.014950595796108246, 0.05628528445959091, -0.05639426037669182, -0.02549615129828453, 0.0005975181120447814, 0.03301529958844185, 0.06726203858852386, 0.05583488568663597, -0.01665237918496132, 0.0479644313454628, 0.001540954108349979, 0.018091809004545212, 0.09645836055278778, 0.0155542753636837, -0.024937273934483528, 0.05872337520122528, -0.06592713296413422, -0.06009545177221298, -0.040195614099502563, 0.07554362714290619, -0.06923168152570724, 0.08026647567749023, -0.027100082486867905, 0.023030685260891914, -0.012735007330775261, -0.10693450272083282, 0.007303004618734121, 0.021752748638391495, -0.023794183507561684, -0.05070238560438156, 0.06486805528402328, 0.04776119813323021, 
-0.043739091604948044, 0.0029410128481686115, 0.06335993856191635, 0.027696577832102776, 0.01190115325152874, 0.014422732405364513, -0.05733410269021988, 0.08525995910167694, -0.02439979650080204, 0.06843572109937668, -0.016701480373740196, 0.06824495643377304, 0.02434985339641571, -0.09453707933425903, 0.09898494184017181, -0.031845517456531525, 0.07473299652338028, -0.058903541415929794, -0.06976912915706635, 0.06517872214317322, -0.030632860958576202, 0.037782490253448486, 0.020696289837360382, 0.0036586918868124485]"
2,1,zentrum minderheitenschulwesen,zentrum minderheitenschulwesen,0.6921,NOUN VERB,537,571,"[0.106541208922863, 0.07459547370672226, -0.06118697673082352, 9.66582665569149e-05, -0.0021776140201836824, 0.010109941475093365, -0.047376006841659546, -0.02676333673298359, -0.000973053218331188, 0.06460075825452805, -0.007900549098849297, -0.012783864513039589, 0.03763039782643318, 0.0010952242882922292, 0.020111141726374626, 0.03525778278708458, 0.01239048782736063, 0.05427194759249687, 0.08478965610265732, 0.018743757158517838, -0.041605547070503235, -0.05908990651369095, 0.0006644406239502132, -0.030131759122014046, 0.052287641912698746, -0.03598639741539955, 0.05893125757575035, -0.04137209802865982, 0.011068128980696201, -0.06258238106966019, 0.05671095848083496, -0.04162446781992912, 0.15205995738506317, 0.06888017058372498, -0.06126286834478378, 0.03598131984472275, 0.05650391802191734, 0.06183280050754547, -0.02352617308497429, -0.015995021909475327, -0.03013666719198227, -0.014746074564754963, 0.017698364332318306, 0.0924161896109581, -0.003044591750949621, -0.02951236441731453, -0.11715888231992722, -0.055808160454034805, -0.04605674371123314, -0.10316657274961472, -0.012336591258645058, -0.026204492896795273, 0.0027793976478278637, 0.018452806398272514, -0.06246175989508629, 0.023571135476231575, 0.01674182340502739, -0.011907193809747696, 0.0031487364321947098, 0.02872726134955883, -0.030260834842920303, 0.013076328672468662, -0.054674554616212845, 0.030086921527981758, -0.019088763743638992, -0.028017403557896614, 0.03926639258861542, 0.05236378312110901, 0.013917805626988411, -0.05134301632642746, 0.012767687439918518, -0.026227429509162903, -0.01021269429475069, 0.04675579071044922, 0.0879572406411171, 0.06367393583059311, -0.03425789251923561, 0.08145802468061447, 0.05812731757760048, -0.05360660329461098, 0.09117008745670319, 0.054346147924661636, 0.061811912804841995, 0.0022994207683950663, 0.02173011191189289, -0.0010154503397643566, 
-0.04911629855632782, -0.010855695232748985, 0.03750362992286682, -0.03868148848414421, -0.01226317510008812, 0.022867081686854362, 0.03505559638142586, -0.06509360671043396, 0.0431000292301178, -0.06411410123109818, -0.04346365109086037, -0.08546481281518936, 0.03659137338399887, 0.18585078418254852, -0.016210559755563736, 0.017602287232875824, 0.07810717076063156, -0.0003528650850057602, -0.05196056514978409, 0.03429535776376724, 0.0911516547203064, -0.05730742588639259, -0.01743202470242977, 0.01992412842810154, -0.02962811104953289, -0.0166860930621624, -0.07310621440410614, 0.03271517902612686, -0.029564397409558296, -0.009661223739385605, 0.09157568216323853, -0.007300205994397402, 0.03478018566966057, 0.08598203957080841, -0.08012408763170242, 0.03174588084220886, -0.051728177815675735, -0.10738082230091095, 0.06439372897148132, -0.024732163175940514, -0.035300299525260925, 0.06776843965053558, 0.004307807423174381, -0.011278616264462471, -0.040609315037727356, 0.027761094272136688, -0.001928056008182466, 0.02381337247788906, 0.025773385539650917, -0.07285520434379578, 0.024837255477905273, -0.0005605467595160007, 0.05281779542565346, -0.04463830962777138, 0.034453630447387695, 0.06900957971811295, 0.005336567759513855, 0.043570540845394135, -0.030410215258598328, 0.02100208029150963, -0.07809555530548096, 0.07820349931716919, 0.03241743892431259, 0.059150394052267075, 0.03512212261557579, 0.006884916219860315, -0.027858445420861244, 0.004843162372708321, -0.04637754708528519, 0.022954687476158142, 0.09142466634511948, 0.01837337017059326, 0.07858093827962875, 0.03739725053310394, -0.06181540712714195, 0.023278608918190002, 0.06668300926685333, 0.03162689134478569, 0.034481946378946304, 0.004703270737081766, -0.00448651285842061, -0.035087063908576965, 0.002508430741727352, -0.024410555139183998, 0.0737726241350174, 0.025281058624386787, 0.07365147769451141, 0.05713231489062309, 0.03967548906803131, -0.0750693753361702, -0.025054670870304108, 
0.10820469260215759, -0.022841161116957664, -0.050563935190439224, -0.09182245284318924, -0.05874142423272133, -0.010966412723064423, -0.03739366680383682, -0.0017392662120983005, 0.02779448963701725, 0.059071749448776245, -0.10051697492599487, 0.007565637584775686, 0.0004582611145451665, -0.10849790275096893, -0.012799902819097042, -0.0038468330167233944, -0.10419396311044693, -0.06546372920274734, -0.0009321157122030854, 0.04565180465579033, -0.18614117801189423, 0.00863052811473608, 0.01929248310625553, -0.09895684570074081, 0.016350936144590378, -0.06304658949375153, 0.024120552465319633, 0.032405562698841095, -0.01158100925385952, 0.08401751518249512, -0.04670768603682518, 0.08062569797039032, 0.031155720353126526, 0.0017044987762346864, -0.036426007747650146, -0.008030770346522331, -0.028740253299474716, 0.0221669040620327, 0.04032621905207634, 0.00382498768158257, 0.027974214404821396, -0.03601902350783348, 0.02634100429713726, -0.0526307113468647, 0.04034155234694481, -0.03145713359117508, -0.07951541244983673, -0.035019636154174805, -0.017789088189601898, -0.09499502927064896, 0.045302681624889374, 0.031500428915023804, 0.036407507956027985, 0.016044028103351593, -0.051019031554460526, 0.027445968240499496, 0.059877343475818634, -0.005989632569253445, -0.0844760462641716, 0.12996318936347961, -0.002364642918109894, -0.10852324217557907, 0.0005152004887349904, -0.0009007704211398959, 0.06669764220714569, -0.04522520303726196, 0.012631850317120552, -0.010072794742882252, 0.02177802473306656, 0.003127241274341941, 0.09995120018720627, -0.0010360970627516508, -0.004627043381333351, -0.03782869502902031, -0.0865999311208725, -0.06037161499261856, -0.050766635686159134, 0.01130732987076044, -0.057273466140031815, 0.017765475437045097, 0.017757568508386612, -0.03006371110677719, -0.0830991119146347, -0.02776247262954712, -0.03580504655838013, -0.09588706493377686, 0.08296535909175873, 0.05229318514466286, -0.04515818879008293, -0.05035253241658211, 
-0.01675960049033165, -0.0049682739190757275, 0.05941714346408844, 0.024265799671411514, 0.05355130136013031, -0.038297902792692184, -0.026783868670463562, -0.055414967238903046, -0.009069208987057209, 0.02992071770131588, -0.025247296318411827, 0.10157250612974167, 0.020468782633543015, -0.005405390169471502, 0.01737665943801403, -0.02434743009507656, 0.03669673949480057, -0.012890439480543137, 0.044806547462940216, -0.04173910617828369, -0.004346023313701153, 0.02256465144455433, 0.07016265392303467, 0.0002818784851115197, 0.03859787434339523, -0.04648749157786369, 0.033964622765779495, 0.0475643053650856, 0.03537638485431671, -0.02313327044248581, -0.07226047664880753, -0.06665146350860596, 0.05353984236717224, 0.05530821159482002, 0.08132265508174896, -0.052982259541749954, -0.03681959584355354, 0.0022982980590313673, -0.06337310373783112, 0.0016566436970606446, -0.013318322598934174, -0.018208038061857224, 0.03851032257080078, 0.02762928232550621, -0.10264097154140472, 0.019825825467705727, -0.057000890374183655, -0.03370371833443642, -0.010463220067322254, -0.02364305593073368, -0.10540378838777542, 0.04942377656698227, -0.1155300885438919, 0.022656787186861038, -0.058638449758291245, -0.10549267381429672, 0.04881560057401657, -0.0027417561504989862, -0.006386774592101574, 0.021896198391914368, -0.04008129611611366, 0.01804390735924244, 0.0832149013876915, -0.07690286636352539, -0.02425014227628708, -0.06672544032335281, -0.032684434205293655, 0.0283314548432827, 0.020688742399215698, 0.0007676251116208732, 0.028706533834338188, 0.043194063007831573, -0.007237447891384363, 0.034386634826660156, -0.018901383504271507, 0.0012224490055814385, 0.034673985093832016, -0.05789951607584953, -0.07083290070295334, -0.06842870265245438, 0.023140378296375275, -0.047216784209012985, -0.015203755348920822, 0.01728920452296734, 0.021323077380657196, -0.00361688737757504, -0.09357771277427673, -0.01752626523375511, 0.0272016953676939, -0.016707075759768486, 
0.015414653345942497, 0.07550539076328278, -0.02128022536635399, -0.03699357062578201, -0.04042341560125351, 0.04941912367939949, 0.009178324602544308, 0.009957287460565567, 0.021167051047086716, -0.07893045246601105, 0.0917615070939064, -0.035101018846035004, 0.0067708054557442665, -0.020636290311813354, 0.035510074347257614, 0.015622514300048351, -0.012924237176775932, 0.11762026697397232, -0.04080066829919815, 0.040495697408914566, 0.005748016759753227, -0.07496850937604904, -0.005310157313942909, 0.05559217557311058, 0.022710632532835007, -0.06277304887771606, 0.0834464430809021]"
3,1,privaten pädagogischen,privat pädagogisch,0.6817,ADJ NOUN,74,96,"[0.016026685014367104, 0.0017476006178185344, -0.05314597487449646, 0.018245095387101173, 0.004732773173600435, 0.004225023090839386, -0.05356220155954361, 0.010315547697246075, 0.013905704952776432, 0.023497510701417923, 0.017649788409471512, 0.10878106951713562, 0.034262143075466156, 0.04103129729628563, -0.005812716670334339, -0.014324533753097057, 0.0016073117731139064, 0.04968142509460449, 0.0726785808801651, 0.06424277275800705, 0.024093085899949074, -0.04387516528367996, -0.009755827486515045, -0.02703654021024704, -0.02332880347967148, -0.04093065857887268, 0.037219755351543427, -0.04485808685421944, -0.018662303686141968, -0.13199935853481293, 0.017546404153108597, -0.1172303780913353, 0.0060605076141655445, 0.05089803785085678, -0.03969917073845863, 0.05507291853427887, 0.010586092248558998, 0.018440743908286095, 0.024941062554717064, -0.027753928676247597, 0.019054848700761795, -0.008883889764547348, -0.025252308696508408, 0.049893490970134735, 0.008433034643530846, -0.03275000676512718, -0.04316455125808716, -0.014310747385025024, -0.017944449558854103, -0.0876379907131195, -0.09456778317689896, -0.04393313080072403, -0.06365875899791718, -0.03585253655910492, -0.009909548796713352, -0.028452496975660324, 0.08394928276538849, 0.03806878998875618, -0.043901823461055756, 0.1103372722864151, -0.046559661626815796, 0.011116639710962772, -0.09174221009016037, 0.025325803086161613, 0.03292621672153473, 0.0582621768116951, 0.03650955110788345, 0.036539074033498764, 0.008041124790906906, -0.013482431881129742, -0.0008151010842993855, 0.003868325613439083, 0.026723243296146393, 0.023774029687047005, 0.10514411330223083, -0.005641223397105932, -0.023809392005205154, 0.07280592620372772, 0.06165945902466774, -0.05087582767009735, 0.04653354734182358, 0.04209289699792862, 0.03566247597336769, 0.05472315847873688, -0.07373078912496567, 0.016185084357857704, -0.006342259701341391, 
0.0006009661592543125, 0.03111329860985279, -0.048059310764074326, 0.035162586718797684, -0.10425780713558197, 0.010548051446676254, 0.013670207001268864, 0.06318197399377823, -0.038424380123615265, -0.014730839058756828, -0.07366044819355011, 0.0351521335542202, 0.2740519046783447, -0.08123665302991867, 0.012146645225584507, 0.04681582748889923, -0.04635704681277275, -0.044203151017427444, -0.020499419420957565, 0.0586387924849987, -0.09513063728809357, -0.034056831151247025, -0.017982088029384613, -0.01499641127884388, -0.03711046651005745, -0.03929927945137024, -0.008256449364125729, 0.026159949600696564, 0.00798928551375866, 0.05807508900761604, 0.04218485578894615, 0.025377318263053894, -0.0018929803045466542, -0.029884807765483856, 0.025162646546959877, 0.05899918079376221, -0.10348977893590927, 0.012171338312327862, -0.0983583852648735, -0.04676322266459465, 0.08988327533006668, 0.02851918339729309, 0.030580583959817886, -0.010181406512856483, 0.01731100305914879, -0.05294365808367729, 0.046328525990247726, 0.034664031118154526, -0.012213039211928844, -0.041771430522203445, -0.033809978514909744, 0.13571307063102722, 0.06835827231407166, 0.017380595207214355, 0.03605680167675018, 0.013403859920799732, 0.08958921581506729, 0.008440675213932991, 0.028977852314710617, 0.11372383683919907, 0.07098755985498428, -0.0016186753055080771, 0.054062943905591965, 0.052831459790468216, 0.006084106396883726, -0.0013305778848007321, -0.058544743806123734, 0.0345158651471138, -0.03389502689242363, 0.06636908650398254, 0.026770975440740585, 0.0426858626306057, -0.022982493042945862, -0.09704917669296265, 0.02013280801475048, 0.0386621318757534, 0.006280509755015373, 0.08359774947166443, -0.06666749715805054, -0.004633952397853136, -0.09211254119873047, -0.02945885993540287, -0.024336155503988266, 0.05946757644414902, 0.0019445515936240554, -0.029767736792564392, 0.046991217881441116, -0.010339990258216858, -0.056168071925640106, -0.034049734473228455, 0.03166570886969566, 
-0.07174073904752731, -0.030159983783960342, -0.02836446836590767, -0.07677685469388962, -0.029529262334108353, 0.006816142238676548, -0.02111709676682949, 0.02583349496126175, 0.01518107671290636, -0.010918742045760155, 0.08941984176635742, 0.12505948543548584, -0.09261293709278107, 0.04401908814907074, -0.03726751729846001, -0.05762013792991638, -0.06560564041137695, 0.010100160725414753, 0.1637657880783081, -0.1279904693365097, -0.034182317554950714, 0.0332641564309597, -0.09326894581317902, 0.006604825146496296, 0.013485779985785484, -0.01782720908522606, -0.002045578323304653, -0.023898299783468246, 0.040380820631980896, -0.023508243262767792, 0.019121648743748665, 0.05515705794095993, 0.014770190231502056, 0.04532362148165703, -0.020053789019584656, 0.007751022465527058, -0.011820961721241474, 0.08178205788135529, -0.06914103776216507, 0.05385017395019531, -0.04627559334039688, 0.018698852509260178, -0.03864593803882599, 0.049212269484996796, -0.009900427423417568, -0.087922602891922, -0.043354228138923645, -0.02586652897298336, -0.0773538127541542, 0.06351354718208313, 0.0549180693924427, -0.024533936753869057, -0.003077202243730426, -0.0536922886967659, -0.00879649817943573, 0.0526246502995491, -0.05271592363715172, -0.06510160863399506, 0.11352387815713882, 0.05283245071768761, -0.07951223850250244, 0.018805282190442085, -0.05436104163527489, 0.006290852092206478, -0.055214207619428635, 0.03292545676231384, -0.045340001583099365, 0.033271268010139465, 0.0031305174343287945, 0.04872235655784607, 0.07462010532617569, -0.0027182300109416246, -0.08705654740333557, -0.017665265128016472, -0.04922463744878769, -0.015103419311344624, 0.016941223293542862, 0.002322320593520999, -0.0807918831706047, -0.058499474078416824, -0.09252242743968964, -0.05143117159605026, -0.02306216210126877, -0.06688390672206879, -0.04377815127372742, 0.061985041946172714, 0.043600983917713165, -0.005013894289731979, -0.02316158451139927, -0.05563526973128319, -0.01635412685573101, 
-0.032129961997270584, -0.03197433426976204, -0.042711466550827026, -0.00887866597622633, 0.030790850520133972, -0.03799981251358986, 0.010126219131052494, 0.017150837928056717, -0.09859468787908554, 0.02114284224808216, -0.02277950569987297, -0.019083915278315544, 0.0459931455552578, 0.06181756779551506, 0.03308168053627014, 0.07735393941402435, -0.009229953400790691, -0.0367431715130806, 0.006235555279999971, -0.0432569719851017, 0.01568969525396824, 0.012000255286693573, 0.07731066644191742, -0.040073707699775696, 0.03809591755270958, 0.03942810371518135, -0.0011866067070513964, 0.029019106179475784, -0.01620353013277054, -8.151627116603777e-05, 0.10428663343191147, 0.03125739097595215, -0.05378326028585434, -0.08240104466676712, 0.04196874052286148, 0.06316866725683212, -0.012555730529129505, -0.014991612173616886, -0.016460346058011055, -0.0007793541299179196, -0.0037401861045509577, 0.07980271428823471, -0.053038883954286575, 0.03728950396180153, -0.04635997861623764, 0.014861272647976875, -0.0703030601143837, 0.005109200719743967, -0.04127301275730133, 0.01366669312119484, -0.1297280639410019, -0.017809029668569565, -0.013553544878959656, 0.050075728446245193, 0.06152038648724556, -0.005468017887324095, 0.017190605401992798, -0.03772607445716858, -0.02360808663070202, -0.021178243681788445, 0.027645492926239967, -0.1102544441819191, -0.060922957956790924, 0.00548954214900732, 0.016470151022076607, 0.007640166208148003, -0.0013710440834984183, 0.027737803757190704, 0.03852114826440811, 0.02954309992492199, 0.008179748430848122, 0.07338523119688034, -0.006661418825387955, 0.007836359553039074, 0.0726483091711998, -0.07615252584218979, -0.03383127227425575, 0.023319236934185028, -0.023871228098869324, -0.04171557351946831, 0.011496997438371181, 0.028761794790625572, 0.013164296746253967, 0.024671513587236404, -0.05643732473254204, -0.048220161348581314, 0.03709328547120094, -0.012868253514170647, 0.003279466414824128, 0.006036120001226664, 0.04642835259437561, 
-0.03795819357037544, -0.08770070970058441, 0.0556410476565361, 0.03811202570796013, 0.02027621679008007, 0.05110292136669159, -0.04103192314505577, 0.023508163169026375, 0.0127505948767066, 0.00848645530641079, 0.049864839762449265, -0.0440513901412487, -0.014085708186030388, -0.09729102998971939, 0.051583170890808105, 0.05190696194767952, 0.08112519979476929, 0.005565792787820101, -0.09626203775405884, 0.027682211250066757, 0.004935853183269501, 0.02617589943110943, -0.037044525146484375, 0.050931718200445175]"
4,1,hochschule burgenland,hochschule burgenland,0.6308,NOUN VERB,97,118,"[0.056962572038173676, 0.08657726645469666, -0.03909336403012276, -0.00334254652261734, -0.02765103615820408, -0.0425863191485405, -0.0004893316654488444, 0.05961208790540695, -0.010172360576689243, 0.017220785841345787, 0.036075957119464874, -0.09701685607433319, 0.017108220607042313, 0.019426623359322548, -0.004748285748064518, -0.020871814340353012, 0.02052338980138302, 0.07784771174192429, 0.0775308683514595, -0.01810351200401783, -0.007174672558903694, -0.04282454773783684, 0.012948841787874699, -0.04065529257059097, 0.052734922617673874, -0.03211318701505661, 0.0029678274877369404, -0.05525650829076767, 0.01196009386330843, -0.059624332934617996, 0.023175612092018127, -0.07170560210943222, 0.14754660427570343, -0.0052931965328752995, -0.04181423410773277, 0.08520793914794922, 0.012151889503002167, 0.04821239784359932, 0.03375271335244179, 0.04142482578754425, -0.05013291910290718, -0.0011777571635320783, 0.008708765730261803, 0.061116788536310196, 0.017305994406342506, 0.005788631271570921, -0.024467144161462784, -0.007341095246374607, -0.006392895244061947, -0.021157346665859222, -0.001713845762424171, -0.03550874814391136, -0.0888945534825325, -0.032211195677518845, -0.0038111787289381027, 0.026815548539161682, 0.030056515708565712, 0.03453974425792694, -0.002450021915137768, 0.023337772116065025, 0.00817700196057558, 0.08781267702579498, -0.1276894211769104, -0.008853810839354992, -0.048637744039297104, -0.04079090803861618, 0.024694038555026054, 0.08314419537782669, -0.03299035504460335, 0.02962096408009529, 0.03025318868458271, -0.04617483168840408, -0.015808532014489174, 0.04127172380685806, 0.050877079367637634, 0.02738524042069912, -0.03720509633421898, 0.061230022460222244, -0.04037198796868324, -0.05046771094202995, 0.03912696614861488, -0.05097023770213127, 0.0032391746062785387, -0.04168245941400528, -0.003831441979855299, 0.006653670687228441, -0.0028276299126446247, 
0.0595543310046196, 0.08644891530275345, -0.07505214959383011, 0.09518800675868988, -0.05593118071556091, 0.020757613703608513, -0.05181838944554329, 0.06329570710659027, 0.007254110649228096, 0.005749745760113001, -0.05819595232605934, 0.04709295555949211, 0.26883095502853394, -0.010896583087742329, 0.009847049601376057, 0.02455775812268257, 0.02092602290213108, -0.044009286910295486, 0.01443819422274828, 0.034861162304878235, -0.033466652035713196, -0.009501022286713123, 0.017247602343559265, -0.03276515379548073, -0.07185782492160797, -0.05434801056981087, 0.005098024848848581, 0.009519428014755249, 0.011762022972106934, 0.04337850213050842, 0.0011930384207516909, 0.018201110884547234, 0.0479435957968235, -0.010854482650756836, 0.002107496839016676, 0.022677328437566757, -0.044162724167108536, 0.002249337499961257, -0.06080882251262665, 0.012743936851620674, 0.09812548756599426, -0.008686725050210953, 0.01792220026254654, 0.07583126425743103, 0.08647632598876953, -0.022267764434218407, 0.027451345697045326, -0.0219347532838583, -0.02268478088080883, 0.039314232766628265, 0.04663115739822388, -0.013255083933472633, -0.06753534823656082, -0.023701675236225128, 0.029918529093265533, 0.010014299303293228, 0.00340469041839242, -0.010699448175728321, -0.015123189426958561, -0.038739997893571854, 0.05661731958389282, 0.04384201765060425, 0.04717547446489334, -0.034780777990818024, -0.04701283201575279, 0.04898589849472046, -0.023440180346369743, -0.008818316273391247, 0.020693503320217133, 0.054022155702114105, 0.04736173152923584, 0.09135231375694275, -0.002048393478617072, -0.05044148489832878, 0.028968116268515587, 0.08620085567235947, -0.028221258893609047, -0.0005837288917973638, -0.007713846862316132, 0.01102223340421915, -0.04462023824453354, 0.02994297817349434, -0.011441346257925034, 0.04209381341934204, 0.04675717279314995, 0.09683705121278763, 0.10283352434635162, 0.040042608976364136, -0.01499870978295803, -0.03260455280542374, 0.025553490966558456, 
-0.024589279666543007, -0.009718261659145355, -0.06176735460758209, -0.008292600512504578, -0.026646388694643974, 0.021370990201830864, -0.0039603873156011105, 0.05624046549201012, 0.02273782715201378, -0.06636517494916916, 0.08728866279125214, 0.06745785474777222, -0.04300014674663544, -0.02769148163497448, -0.03211994469165802, -0.1339147984981537, -0.06345970928668976, 0.00989063922315836, 0.057427626103162766, -0.1141648218035698, -0.029478788375854492, 0.0397421196103096, -0.09967076778411865, 0.012527531012892723, -0.02097967080771923, -0.004523662384599447, 0.047920312732458115, -0.011733868159353733, 0.03682669997215271, -0.00261376122944057, 0.0014061336405575275, 0.021161993965506554, -0.00028842539177276194, -0.004702882841229439, 0.040281932801008224, -0.026904966682195663, -0.016163835301995277, 0.01790553890168667, -0.0035355861764401197, 0.021192746236920357, -0.11060043424367905, 0.04317348450422287, -0.026382949203252792, -0.034151170402765274, 0.007962589152157307, -0.1641259640455246, 0.03511330485343933, -0.04521141201257706, -0.07907982915639877, 0.024964377284049988, -0.004417745396494865, -0.002802639501169324, -0.019949713721871376, 0.0015095664421096444, -0.005330082029104233, -0.0005415189662016928, -0.0656806081533432, -0.04597422853112221, 0.09787721931934357, -0.007039735559374094, -0.049973245710134506, -0.05235089361667633, 0.01771034300327301, -0.03113604336977005, -0.09145111590623856, 0.02810378186404705, -0.016081804409623146, -0.0070390463806688786, -0.013500064611434937, 0.0624212920665741, -0.028328781947493553, 0.07915518432855606, -0.04857519641518593, -0.058657966554164886, -0.08794774115085602, 0.006708226632326841, -0.005386730190366507, 0.00047868862748146057, -0.003106104675680399, 0.04994167014956474, -0.01626468449831009, -0.024484308436512947, 0.08329994976520538, -0.06326854228973389, -0.10446170717477798, 0.030997104942798615, 0.058381304144859314, -0.04658573493361473, -0.009477327577769756, 0.027642982080578804, 
-0.0007130078156478703, 0.04240423068404198, -0.043751053512096405, 0.027073824778199196, -0.04093245044350624, -0.05337635800242424, 0.004962887614965439, -0.03380616381764412, 0.007317240349948406, -0.03619120642542839, 0.07499001920223236, 0.04820002242922783, -0.008872884325683117, -0.04474819824099541, -0.0005070235347375274, 0.014385971240699291, 0.011753616854548454, -0.00606463011354208, -0.03746941685676575, 0.03701825439929962, -0.014531443826854229, 0.04022727906703949, -0.012245276011526585, 0.08334056288003922, -0.08656756579875946, 0.027750475332140923, 0.029434384778141975, 0.017471974715590477, 0.00367155484855175, 0.013067454099655151, -0.09120162576436996, 0.08511600643396378, 0.08727850019931793, 0.021898947656154633, -0.04036153107881546, -0.08700168132781982, -0.06728796660900116, -0.05322907865047455, -0.05398634821176529, 0.027989119291305542, -0.0070649017579853535, 0.013395259156823158, 0.02141193486750126, -0.09604120999574661, 0.09732785075902939, -0.03724086284637451, -0.0014956268714740872, 0.028313295915722847, -0.002035849029198289, -0.07861723750829697, 0.07043111324310303, -0.18410424888134003, -0.03552308306097984, -0.035829536616802216, -0.14953748881816864, 0.08759760111570358, 0.02705986611545086, -0.05896171182394028, 0.01158221997320652, -0.02952706068754196, -0.005813836120069027, 0.023772981017827988, -0.10798123478889465, -0.0011183222522959113, -0.08108650892972946, -0.04138405993580818, 0.06911096721887589, 0.0008745487430132926, 0.005146391689777374, 0.016145914793014526, 0.01905716024339199, -0.008862610906362534, 0.0042722090147435665, 0.03462269902229309, -0.009851882234215736, -0.001674184575676918, -0.07669462263584137, -0.05994207784533501, -0.03307518735527992, -0.05267734080553055, 0.02326439879834652, 0.004924978129565716, 0.012790150009095669, 0.09836570918560028, -0.06018956005573273, -0.07987358421087265, 0.032333243638277054, 0.06934433430433273, -0.05044975504279137, 0.047379180788993835, 
0.03503207489848137, -0.056930918246507645, 0.044887103140354156, -0.06260120123624802, 0.05462503060698509, 0.05515137314796448, 0.046036459505558014, 0.04757332429289818, -0.030880050733685493, 0.08523014932870865, -0.003443164750933647, 0.06855472177267075, -0.09731083363294601, 0.07404830306768417, 0.021078824996948242, -0.06542203575372696, 0.06509719789028168, 0.022358709946274757, -0.015483537688851357, -0.04850572720170021, -0.07103826105594635, 0.03851741552352905, 0.03556850180029869, -0.027438385412096977, -0.044819124042987823, 0.06018131598830223]"
