In [1]:
from azure.core.credentials import AzureKeyCredential
from azure.ai.textanalytics import TextAnalyticsClient

import os
import openai
from dotenv import load_dotenv, dotenv_values

# Export the variables from the default .env lookup into the process environment.
load_dotenv()

# Also read the local .env file into a mapping, so the settings below come
# straight from that file.
config = dotenv_values(dotenv_path=".env")

# Plain indexing (not .get) so an absent key raises KeyError in this cell.
API_KEY = config["API_KEY"]
ENDPOINT = config["ENDPOINT"]

In [2]:
def client():
    """Build a Text Analytics client from the module-level settings.

    Reads the module-level ``API_KEY`` and ``ENDPOINT`` values, wraps the key
    in an ``AzureKeyCredential`` and constructs a ``TextAnalyticsClient``.

    Returns:
        The constructed ``TextAnalyticsClient``, or ``None`` if anything
        raised during construction (the error is printed, not re-raised).
    """
    try:
        ta_credential = AzureKeyCredential(API_KEY)
        text_analytics_client = TextAnalyticsClient(
            endpoint=ENDPOINT,
            credential=ta_credential)
        return text_analytics_client
    except Exception as e:
        # f-string so the actual exception text is shown; the original
        # printed the literal characters "{e}".
        print(f"Error: {e}")
        return None

In [3]:
# `client` is the factory function until this cell rebinds it to the object
# the factory returns. The callable() guard keeps the cell re-runnable: on a
# second run `client` is already the client object and must not be called.
# NOTE(review): assumes the client instance itself is not callable — confirm.
if callable(client):
    client = client()

# The factory returns None when construction fails; stop here with a clear
# message rather than an AttributeError on None in the request below.
if client is None:
    raise RuntimeError(
        "Text Analytics client could not be created; check API_KEY and ENDPOINT."
    )

# One sample sentence per language to send through language detection.
text_strings = [
    "This is written in English.",
    "Ceci est écrit en Français.",
    "Dies ist in deutscher Sprache geschrieben.",
    "Esto está escrito en español.",
    "Questo è scritto in italiano.",
    "これは日本語で書かれています。",
    "이것은 한국어로 쓰여졌습니다.",
    "這是用中文寫的。"
]

# All documents go out in a single call, with the same country hint.
response = client.detect_language(documents=text_strings, country_hint="US")


In [6]:
# Pair each input sentence with its result; this relies on results coming
# back in the same order as the submitted documents.
for text, language_detected in zip(text_strings, response):
    print('original text:')
    print(text)
    if language_detected.is_error:
        # A failed document carries an error instead of a primary_language;
        # report it rather than letting the attribute access raise.
        print('Language detection failed: {0} - {1}'.format(
            language_detected.error.code, language_detected.error.message))
    else:
        print('Language detected: {0}'.format(language_detected.primary_language.name))
        print('Language confidence score: {0}'.format(language_detected.primary_language.confidence_score))
    print("")

original text:
This is written in English.
Language detected: English
Language confidence score: 0.99

original text:
Ceci est écrit en Français.
Language detected: French
Language confidence score: 1.0

original text:
Dies ist in deutscher Sprache geschrieben.
Language detected: German
Language confidence score: 1.0

original text:
Esto está escrito en español.
Language detected: Spanish
Language confidence score: 1.0

original text:
Questo è scritto in italiano.
Language detected: Italian
Language confidence score: 1.0

original text:
これは日本語で書かれています。
Language detected: Japanese
Language confidence score: 1.0

original text:
이것은 한국어로 쓰여졌습니다.
Language detected: Korean
Language confidence score: 1.0

original text:
這是用中文寫的。
Language detected: Chinese_Traditional
Language confidence score: 1.0

