In [None]:
import os
import re

def find_longest_text_and_word_in_directory(directory):
    longest_text = ""
    longest_word = ""
    max_text_length = 0
    max_word_length = 0

    # Iterate through all files in the directory
    for file in os.listdir(directory):
        if file.endswith('.txt'):
            file_path = os.path.join(directory, file)
            with open(file_path, 'r', encoding='utf-8') as file_open:
                content = file_open.read()
                # Find the longest text
                if len(content) > max_text_length:
                    max_text_length = len(content)
                    longest_text = content
                
                # Regex pattern to find text between start and end tags
                pattern = r'<start_"([^"]+)">([^<]+)<end_"([^"]+)">'
                # Find all matches
                matches = re.findall(pattern, content)
                
                for match in matches:
                    # Get the text between tags
                    between_tags = match[1]
                    # Check if the text is longer than the current longest word
                    if len(between_tags) > max_word_length:
                        max_word_length = len(between_tags)
                        longest_word = between_tags

    return longest_text, longest_word

# Example directory
directory = "."  # Current directory
longest_text, longest_word = find_longest_text_and_word_in_directory(directory)

print("Longest text:")
print(longest_text)
print("Longest word between tags:")
print(longest_word)

print("Length of longest text:", len(longest_text))
print("Length of longest word:", len(longest_word))


In [1]:
import sys
from PyQt5.QtWidgets import QApplication, QWidget, QLabel, QVBoxLayout, QPushButton, QFileDialog, QComboBox
import easyocr
import pytesseract
from PIL import Image

class ImageReader(QWidget):
    def __init__(self):
        super().__init__()

        self.setWindowTitle("Image Text Reader")
        self.setGeometry(100, 100, 400, 250)

        self.layout = QVBoxLayout()

        self.image_label = QLabel("Görsel burada görünecek")
        self.layout.addWidget(self.image_label)

        self.load_button = QPushButton("Görsel Yükle")
        self.load_button.clicked.connect(self.load_image)
        self.layout.addWidget(self.load_button)

        self.ocr_selector = QComboBox()
        self.ocr_selector.addItems(["EasyOCR", "Tesseract OCR"])
        self.layout.addWidget(self.ocr_selector)

        self.text_label = QLabel("Metin burada görünecek")
        self.layout.addWidget(self.text_label)

        self.setLayout(self.layout)

    def load_image(self):
        options = QFileDialog.Options()
        file_path, _ = QFileDialog.getOpenFileName(self, "Görsel Yükle", "", "Image files (*.jpg *.png *.jpeg *.bmp *.gif)", options=options)
        if file_path:
            self.process_image(file_path)

    def process_image(self, file_path):
        ocr_method = self.ocr_selector.currentText()

        if ocr_method == "EasyOCR":
            reader = easyocr.Reader(['tr'])  # Türkçe dil modellerini kullan
            results = reader.readtext(file_path)
            text = "\n".join([detection[1] for detection in results])
        else:  # Tesseract OCR
            text = pytesseract.image_to_string(Image.open(file_path), lang='tur')

        self.text_label.setText(text)

if __name__ == "__main__":
    app = QApplication(sys.argv)
    window = ImageReader()
    window.show()
    sys.exit(app.exec_())


SystemExit: 0

  warn("To exit: use 'exit', 'quit', or Ctrl-D.", stacklevel=1)
