In [1]:
import spacy
from spacy import displacy

# Load the small English pipeline.
nlp = spacy.load("en_core_web_sm")

# Run the pipeline over a sample sentence.
doc = nlp("Apple is looking at buying U.K. startup for $1 billion")

# Print one line per entity: its text, character span, label, and the
# description spaCy gives for that label.
for ent in doc.ents:
    char_span = (ent.start_char, ent.end_char)
    print(ent.text, *char_span, ent.label_, spacy.explain(ent.label_))

# Render the recognised entities inline in the notebook.
displacy.render(doc, style="ent", jupyter=True)


Apple 0 5 ORG Companies, agencies, institutions, etc.
U.K. 27 31 GPE Countries, cities, states
$1 billion 44 54 MONEY Monetary values, including unit


In [3]:
# Print spaCy's description for a few entity labels, one "LABEL: description" per line.
tags = ["GPE", "NORP", "ORDINAL"]
print("\n".join(f"{tag}: {spacy.explain(tag)}" for tag in tags))

GPE: Countries, cities, states
NORP: Nationalities or religious or political groups
ORDINAL: "first", "second", etc.


In [5]:
# Sample message to scan for person names.
# Relies on the `nlp` pipeline loaded in an earlier cell ('en_core_web_sm');
# note that a later cell rebinds `nlp` to a German model.
text = "Dear Joe! I have organized a meeting with Elon Musk from Siemens for tomorrow. Meeting place is Vienna."
doc = nlp(text)

# Keep the text of every entity labelled PERSON, in document order.
persons = []
for ent in doc.ents:
    if ent.label_ == "PERSON":
        persons.append(ent.text)
print(persons)


['Joe', 'Elon Musk']


In [16]:
import spacy
import PyPDF2 as pypdf


# Load the small German pipeline.
# NOTE: this rebinds `nlp`, which an earlier cell bound to the English
# 'en_core_web_sm' pipeline. Any earlier cell that uses `nlp` without reloading
# it will run against the German pipeline if re-executed after this cell.
nlp = spacy.load("de_core_news_sm")

def extract_text_from_pdf(pdf_path):
    """Return the text of every page of a PDF, concatenated in page order.

    Args:
        pdf_path: Path of the PDF file; it is opened in binary mode.

    Returns:
        One string made of each page's extracted text joined back to back,
        with no separator inserted between pages.
    """
    with open(pdf_path, "rb") as pdf_file:
        # Join inside the `with` so pages are read while the file is still open.
        pages = pypdf.PdfReader(pdf_file).pages
        return "".join(page.extract_text() for page in pages)
    
# Extract the report text and run the pipeline bound to `nlp` over it.
pdf_text = extract_text_from_pdf("Bericht.pdf")
doc = nlp(pdf_text)

# Unique surface forms of every entity the model labelled as a person ("PER").
person_names = {ent.text for ent in doc.ents if ent.label_ == "PER"}

# Replace longer names first. Replacing in document order can leak part of a
# name: if "Müller" is redacted before "Hans Müller", the text becomes
# "Hans [REDACTED]" and the later full-name replacement no longer matches,
# leaving "Hans" visible. The secondary sort key keeps the order deterministic
# for names of equal length.
# NOTE(review): str.replace matches substrings anywhere in the text, so a short
# entity string is also replaced inside longer, unrelated words.
redacted_text = pdf_text
for name in sorted(person_names, key=lambda n: (-len(n), n)):
    redacted_text = redacted_text.replace(name, "[REDACTED]")

print(redacted_text)

 
  
 
  
Bericht 
 
der unabhängigen  Untersuchungskommission  
zur transparenten  Aufklärung  der Vorkommnisse  rund um die Hypo 
Group Alpe‐Adria 
 
Kurzfassung  
 
  
 
   
Wien, 2. Dezember  2014 
   
  
 
 
 
  
 
 
 
 
 
  
 
 
 
 
 
  
 
 
 Diese Kurzfassung,  eine englische  Übersetzung  und die Langfassung  des Berichts sind unter 
[REDACTED]  abrufbar.  
   
 Inhaltsverzeichnis  
A. [REDACTED]  1 
 
B. ERGEBNISSE  DER UNTERSUCHUNG  .................................................................................  1 
1. Übernahme  von unbeschränkten  Haftungen  durch das Land Kärnten ..........................  1 
2. Verkauf der HBInt an die Bayerische  Landesbank  (BayernLB)  ........................................  3 
3. Verstaatlichung  der HBInt ...............................................................................................  6 
4. Vorgehen  nach der Verstaatlichung  ..............................................................................  13 
 
C. Z