Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Feat(components): nested classifier #836

Merged
merged 1 commit into from
Oct 16, 2023
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
36 changes: 36 additions & 0 deletions examples/demo_rank_largest_animal.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,36 @@
# -*- coding: utf-8 -*-
# Time : 2023/10/16 4:56
# Author : QIN2DIM
# GitHub : https://github.com/QIN2DIM
# Description:
import os
from pathlib import Path

import hcaptcha_challenger as solver

solver.install(upgrade=True)

prompt = "Please click on the largest animal."

data_dir = Path(__file__).parent.joinpath("largest_animal")

pending_keys = ["hedgehog", "rabbit", "raccoon"]


def bytedance():
for pk in pending_keys:
example_paths = [data_dir.joinpath(f"example_{pk}.png")]
images_dir = data_dir.joinpath(pk)
image_paths = [images_dir.joinpath(image_name) for image_name in os.listdir(images_dir)]

classifier = solver.BinaryClassifier()

if result := classifier.execute(prompt, image_paths, example_paths):
print(f">> Match model - resnet={classifier.model_name} prompt={prompt}")
for i, image_path in enumerate(image_paths):
desc = f"{image_path.parent.name}/{image_path.name}"
print(f">> {desc} - result={result[i]}")


if __name__ == "__main__":
bytedance()
Binary file added examples/largest_animal/example_hedgehog.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/example_rabbit.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/example_raccoon.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/hedgehog/f1.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/hedgehog/f2.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/hedgehog/f3.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/hedgehog/f4.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/hedgehog/f5.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/hedgehog/t1.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/hedgehog/t2.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/hedgehog/t3.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/hedgehog/t4.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/rabbit/f1.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/rabbit/f2.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/rabbit/f3.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/rabbit/f4.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/rabbit/f5.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/rabbit/f6.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/rabbit/t1.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/rabbit/t2.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/rabbit/t3.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/raccoon/f1.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/raccoon/f2.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/raccoon/f3.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/raccoon/f4.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added examples/largest_animal/raccoon/f5.png
Binary file added examples/largest_animal/raccoon/f6.png
Binary file added examples/largest_animal/raccoon/true_1.png
Binary file added examples/largest_animal/raccoon/true_2.png
Binary file added examples/largest_animal/raccoon/true_3.png
86 changes: 69 additions & 17 deletions hcaptcha_challenger/components/image_classifier.py
Original file line number Diff line number Diff line change
Expand Up @@ -23,39 +23,91 @@ def __init__(self):
self.modelhub = ModelHub.from_github_repo()
self.modelhub.parse_objects()

def execute(self, prompt: str, images: List[Path | bytes]) -> List[bool | None]:
response = []
self.response: List[bool | None] = []
self.prompt: str = ""
self.label: str = ""
self.model_name: str = ""

def _parse_label(self, prompt: str):
self.prompt = prompt
lang = "zh" if re.compile("[\u4e00-\u9fa5]+").search(prompt) else "en"
_label = split_prompt_message(prompt, lang=lang)
label = label_cleaning(_label)
_label = label_cleaning(prompt)
_label = split_prompt_message(_label, lang=lang)
self.label = _label

focus_label = self.modelhub.label_alias.get(label)
if not focus_label:
logger.debug("Types of challenges not yet scheduled", label=label, prompt=prompt)
return response
def rank_models(
self, nested_models: List[str], example_paths: List[Path | bytes]
) -> ResNetControl | None:
# {{< Rank ResNet Models >}}
rank_ladder = []
for example_path in example_paths:
if isinstance(example_path, bytes):
img_stream = example_path
elif isinstance(example_path, Path):
img_stream = example_path.read_bytes()
else:
continue

focus_name = focus_label if focus_label.endswith(".onnx") else f"{focus_label}.onnx"
net = self.modelhub.match_net(focus_name)
control = ResNetControl.from_pluggable_model(net)
for model_name in nested_models:
net = self.modelhub.match_net(focus_name=model_name)
control = ResNetControl.from_pluggable_model(net)
result_, proba = control.execute(img_stream, proba=True)
if result_:
rank_ladder.append([control, model_name, proba])
if proba[0] > 0.87:
break

# {{< Catch-all Rules >}}
if rank_ladder:
alts = sorted(rank_ladder, key=lambda x: x[-1][0], reverse=True)
best_model, model_name = alts[0][0], alts[0][1]
self.model_name = model_name
return best_model

def inference(self, images: List[Path | bytes], control: ResNetControl):
for image in images:
try:
if isinstance(image, Path):
if not image.exists():
response.append(None)
self.response.append(None)
continue
image = image.read_bytes()
if isinstance(image, bytes):
result = control.execute(image)
response.append(result)
self.response.append(result)
else:
response.append(None)
self.response.append(None)
except Exception as err:
logger.debug(str(err), label=focus_label, prompt=prompt)
response.append(None)
logger.debug(str(err), prompt=self.prompt)
self.response.append(None)

def execute(
self,
prompt: str,
images: List[Path | bytes],
example_paths: List[Path | bytes] | None = None,
) -> List[bool | None]:
self.response = []

self._parse_label(prompt)

# Match: model ranker
if nested_models := self.modelhub.nested_categories.get(self.label, []):
if model := self.rank_models(nested_models, example_paths):
self.inference(images, model)
# Match: common binary classification
elif focus_label := self.modelhub.label_alias.get(self.label):
self.model_name = (
focus_label if focus_label.endswith(".onnx") else f"{focus_label}.onnx"
)
net = self.modelhub.match_net(self.model_name)
control = ResNetControl.from_pluggable_model(net)
self.inference(images, control)
# Match: Unknown cases
else:
logger.debug("Types of challenges not yet scheduled", label=self.label, prompt=prompt)

return response
return self.response


class LocalBinaryClassifier:
Expand Down