<a href="https://colab.research.google.com/github/Iqra-01/Google_AI_studio_Genai/blob/main/templates/object%20identifier.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

##### Copyright 2023 Google LLC

In [None]:
# @title Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# https://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

## Setup

In [1]:
!pip install -U -q "google-generativeai>=0.8.2"

In [2]:
# Import the necessary modules.
import base64
import copy
import json
import pathlib
import requests


import PIL.Image
import IPython.display
from IPython.display import Markdown

# Copy the API key from Colab secrets into the environment. When `google.colab`
# cannot be imported the ImportError is swallowed and the environment is left
# as it was.
try:
    # The SDK will automatically read the key from the GOOGLE_API_KEY environment variable.
    # In Colab, get the key from Colab secrets ("🔑" in the left panel).
    import os
    from google.colab import userdata

    os.environ["GOOGLE_API_KEY"] = userdata.get("GOOGLE_API_KEY")
except ImportError:
    # `google.colab` is unavailable; rely on whatever GOOGLE_API_KEY is already set.
    pass

import google.generativeai as genai

# Parse the arguments

model = 'gemini-1.5-flash' # @param {isTemplate: true}
contents_b64 = 'W3sicGFydHMiOlt7InRleHQiOiJXaGF0IG9iamVjdCBpcyB0aGlzPyBEZXNjcmliZSBob3cgaXQgbWlnaHQgYmUgdXNlZCJ9LHsidGV4dCI6Ik9iamVjdDogIn0seyJmaWxlX2RhdGEiOnsibWltZV90eXBlIjoiaW1hZ2UvanBlZyIsInVybCI6Imh0dHBzOi8vd3d3LmdzdGF0aWMuY29tL2Fpc3R1ZGlvL3NhbXBsZS1pbWFnZXMvb2JqZWN0X2lkZW50aWZpZXIxLmpwZyJ9fSx7InRleHQiOiJEZXNjcmlwdGlvbjogVGhpcyBpcyBhIHBpcGUgb3JnYW4uIEl0IGlzIGEgbGFyZ2UgbXVzaWNhbCBpbnN0cnVtZW50IHRoYXQgaXMgdXNlZCBpbiBjaHVyY2hlcywgY29uY2VydCBoYWxscywgYW5kIG90aGVyIGxhcmdlIGJ1aWxkaW5ncy4gSXQgaXMgbWFkZSB1cCBvZiBhIHNlcmllcyBvZiBwaXBlcyB0aGF0IGFyZSBhcnJhbmdlZCBpbiBkaWZmZXJlbnQgc2l6ZXMgYW5kIHNoYXBlcy4gVGhlIHBpcGVzIGFyZSBwbGF5ZWQgYnkgcHJlc3Npbmcga2V5cyBvbiBhIGtleWJvYXJkLiBXaGVuIGEga2V5IGlzIHByZXNzZWQsIGFpciBpcyBmb3JjZWQgdGhyb3VnaCB0aGUgcGlwZSwgd2hpY2ggcHJvZHVjZXMgYSBzb3VuZC4gVGhlIHNvdW5kIG9mIGEgcGlwZSBvcmdhbiBpcyB2ZXJ5IHBvd2VyZnVsIGFuZCBjYW4gYmUgdXNlZCB0byBjcmVhdGUgYSB3aWRlIHZhcmlldHkgb2YgbXVzaWMuIn0seyJ0ZXh0IjoiT2JqZWN0OiAifSx7ImZpbGVfZGF0YSI6eyJtaW1lX3R5cGUiOiJpbWFnZS9qcGVnIiwidXJsIjoiaHR0cHM6Ly93d3cuZ3N0YXRpYy5jb20vYWlzdHVkaW8vc2FtcGxlLWltYWdlcy9vYmplY3RfaWRlbnRpZmllcjIuanBnIn19LHsidGV4dCI6IkRlc2NyaXB0aW9uOiBUaGlzIGlzIGEgc3VuZGlhbC4gSXQgaXMgYSBkZXZpY2UgdGhhdCB1c2VzIHRoZSBzdW4ncyBwb3NpdGlvbiBpbiB0aGUgc2t5IHRvIHRlbGwgdGhlIHRpbWUuIFRoZSBzdW5kaWFsIGhhcyBhIGZsYXQgc3VyZmFjZSB3aXRoIGEgaG9sZSBpbiB0aGUgY2VudGVyLiBBIG1ldGFsIHJvZCBpcyBwbGFjZWQgdGhyb3VnaCB0aGUgaG9sZSBhbmQgaXMgcG9pbnRlZCBhdCB0aGUgTm9ydGggU3Rhci4gVGhlIHNoYWRvdyBvZiB0aGUgcm9kIGZhbGxzIG9uIHRoZSBmbGF0IHN1cmZhY2UgYW5kIGluZGljYXRlcyB0aGUgdGltZS4ifSx7InRleHQiOiJPYmplY3Q6ICJ9LHsiZmlsZV9kYXRhIjp7Im1pbWVfdHlwZSI6ImltYWdlL2pwZWciLCJ1cmwiOiJodHRwczovL3d3dy5nc3RhdGljLmNvbS9haXN0dWRpby9zYW1wbGUtaW1hZ2VzL29iamVjdF9pZGVudGlmaWVyMy5qcGcifX0seyJ0ZXh0IjoiRGVzY3JpcHRpb246ICJ9XX1d' # @param {isTemplate: true}
generation_config_b64 = 'eyJ0ZW1wZXJhdHVyZSI6MC45LCJ0b3BfcCI6MC45NSwidG9wX2siOjQwLCJtYXhfb3V0cHV0X3Rva2VucyI6ODE5Mn0=' # @param {isTemplate: true}
safety_settings_b64 = "e30="  # @param {isTemplate: true}

# Every template parameter is a base64-encoded JSON document; decode all three
# in the same order as before (contents, generation config, safety settings).
gais_contents, generation_config, safety_settings = (
    json.loads(base64.b64decode(encoded))
    for encoded in (contents_b64, generation_config_b64, safety_settings_b64)
)

# Ask for the complete response in one piece rather than as a stream.
stream = False

# Convert and upload the files

# Scratch directory (relative to the working directory) that holds files
# downloaded from URLs until they are uploaded.
tempfiles = pathlib.Path("tempfiles")
tempfiles.mkdir(parents=True, exist_ok=True)


# Holds the `google.colab.drive` module once Google Drive has been mounted.
drive = None


def upload_file_data(file_data, index):
    """Upload one `file_data` entry to the Files API and record its URI.

    For each file, Google AI Studio either sent:
    - a Google Drive ID (`drive_id`),
    - a URL (`url`),
    - a local file path (`filename`), or
    - the raw bytes (`inline_data`).

    The API only understands `inline_data` or its Files API, so every other
    source is uploaded with `genai.upload_file` and the resulting URI is
    stored in place as `file_data["file_uri"]`. Entries that already carry
    `inline_data` are left untouched.

    Args:
        file_data: Mutable dict describing the file. Must contain
            `mime_type`. The `drive_id` / `url` keys are removed from the
            dict when they are consumed.
        index: Number used as the name of the temporary download inside the
            `tempfiles` directory.

    Raises:
        KeyError: If `file_data` has no `mime_type`.
        ImportError: If a `drive_id` is given but `google.colab` is not
            importable.
        IOError: If the Drive shortcut folder is empty or the local
            `filename` does not exist.
        requests.HTTPError: If downloading `url` returns an error status.
        ValueError: If none of the supported sources is present.
    """
    # Without this declaration the import below would make `drive` a local
    # name and the `drive is None` check would raise UnboundLocalError.
    global drive

    mime_type = file_data["mime_type"]
    if drive_id := file_data.pop("drive_id", None):
        if drive is None:
            from google.colab import drive as colab_drive

            colab_drive.mount("/gdrive")
            # Only remember the module once the mount has succeeded, so a
            # failed mount is retried on the next call.
            drive = colab_drive

        shortcut_dir = pathlib.Path(f"/gdrive/.shortcut-targets-by-id/{drive_id}")
        path = next(shortcut_dir.glob("*"), None)
        if path is None:
            raise IOError(
                f"Google Drive file `{drive_id}` was not found under `{shortcut_dir}`."
            )
        print("Uploading:", str(path))
        file_info = genai.upload_file(path=path, mime_type=mime_type)
        file_data["file_uri"] = file_info.uri
        return

    if url := file_data.pop("url", None):
        response = requests.get(url, timeout=60)
        # Fail loudly instead of uploading an HTTP error page as the file.
        response.raise_for_status()
        name = url.split("/")[-1]
        path = tempfiles / str(index)
        path.write_bytes(response.content)
        print("Uploading:", url)
        file_info = genai.upload_file(path, display_name=name, mime_type=mime_type)
        file_data["file_uri"] = file_info.uri
        return

    if name := file_data.get("filename", None):
        path = pathlib.Path(name)
        if not path.exists():
            raise IOError(
                f"local file: `{name}` does not exist. You can upload files "
                'to Colab using the file manager ("📁 Files" in the left '
                "toolbar)"
            )
        print("Uploading:", name)
        file_info = genai.upload_file(path, display_name=name, mime_type=mime_type)
        file_data["file_uri"] = file_info.uri
        return

    if "inline_data" in file_data:
        # Inline bytes are sent with the request as-is; nothing to upload.
        return

    raise ValueError("Either `drive_id`, `url` or `inline_data` must be provided.")


# Work on a copy so the conversation received from AI Studio stays unmodified.
contents = copy.deepcopy(gais_contents)

# `index` counts file parts across all messages; it is passed to
# `upload_file_data` for each file.
index = 0
for content in contents:
    for part in content["parts"]:
        file_data = part.get("file_data", None)
        if not file_data:
            continue
        upload_file_data(file_data, index)
        index += 1

import json
print(json.dumps(contents, indent=4))

Uploading: https://www.gstatic.com/aistudio/sample-images/object_identifier1.jpg
Uploading: https://www.gstatic.com/aistudio/sample-images/object_identifier2.jpg
Uploading: https://www.gstatic.com/aistudio/sample-images/object_identifier3.jpg
[
    {
        "parts": [
            {
                "text": "What object is this? Describe how it might be used"
            },
            {
                "text": "Object: "
            },
            {
                "file_data": {
                    "mime_type": "image/jpeg",
                    "file_uri": "https://generativelanguage.googleapis.com/v1beta/files/1gx7cm652yin"
                }
            },
            {
                "text": "Description: This is a pipe organ. It is a large musical instrument that is used in churches, concert halls, and other large buildings. It is made up of a series of pipes that are arranged in different sizes and shapes. The pipes are played by pressing keys on a keyboard. When a key is pressed

## Call `generate_content`

In [3]:
from IPython.display import display
from IPython.display import Markdown

# Build the model client, send the prepared contents, and show the reply.
gemini = genai.GenerativeModel(model_name=model)

# Options decoded from the AI Studio template, passed through unchanged.
request_options = {
    "generation_config": generation_config,
    "safety_settings": safety_settings,
    "stream": stream,
}
response = gemini.generate_content(contents, **request_options)

# Render the reply text as Markdown in the cell output.
display(Markdown(response.text))

That's an Allen wrench (also called a hex key).

It's a simple tool used to tighten or loosen screws and bolts that have a hexagonal (six-sided) socket in their heads.  The wrench is inserted into the socket, and then turned to adjust the fastener.  Different sizes of Allen wrenches exist to fit different sizes of hex sockets.


<table class="tfo-notebook-buttons" align="left">
  <td>
    <a target="_blank" href="https://ai.google.dev/gemini-api/docs"><img src="https://ai.google.dev/static/site-assets/images/docs/notebook-site-button.png" height="32" width="32" />Docs on ai.google.dev</a>
  </td>
  <td>
    <a target="_blank" href="https://github.com/google-gemini/cookbook/blob/main/quickstarts"><img src="https://www.tensorflow.org/images/GitHub-Mark-32px.png" />More notebooks in the Cookbook</a>
  </td>
</table>

## [optional] Show the conversation

This section displays the conversation received from Google AI Studio.

In [4]:
# @title Show the conversation, in colab.
import mimetypes

def show_file(file_data):
    """Display one `file_data` entry in the notebook output.

    The file is located through the first of `drive_id`, `url`,
    `inline_data` or `filename` that is present. Images are rendered with
    `IPython.display.Image`. Audio and video are rendered with an inline
    player only when they were sent as `inline_data` and `len()` of that data
    is below 2**12. Everything else is reported as a short text summary
    (name and MIME type).

    Args:
        file_data: Dict describing the file. Must contain `mime_type` and one
            of `drive_id`, `url`, `inline_data` or `filename`. It is not
            modified.

    Raises:
        KeyError: If `file_data` has no `mime_type`.
        IOError: If the Drive shortcut folder is empty or the local
            `filename` does not exist.
        ValueError: If none of the supported sources is present.
    """
    mime_type = file_data["mime_type"]
    # Stays None unless the file was sent inline, so the size checks below
    # never touch an unbound name.
    inline_data = None

    if drive_id := file_data.get("drive_id", None):
        shortcut_dir = pathlib.Path(f"/gdrive/.shortcut-targets-by-id/{drive_id}")
        path = next(shortcut_dir.glob("*"), None)
        if path is None:
            raise IOError(
                f"Google Drive file `{drive_id}` was not found under `{shortcut_dir}`."
            )
        name = path
        kwargs = {"filename": path}
    elif url := file_data.get("url", None):
        name = url
        kwargs = {"url": url}
    elif inline_data := file_data.get("inline_data", None):
        name = None
        kwargs = {"data": inline_data}
    elif name := file_data.get("filename", None):
        if not pathlib.Path(name).exists():
            raise IOError(
                f"local file: `{name}` does not exist. You can upload files to "
                'Colab using the file manager ("📁 Files"in the left toolbar)'
            )
        kwargs = {"filename": name}
    else:
        raise ValueError("Either `drive_id`, `url` or `inline_data` must be provided.")

    if mime_type.startswith("image/"):
        image = IPython.display.Image(**kwargs, width=256)
        IPython.display.display(image)
        print()
        return

    # Inline players are limited to small inline payloads; files whose size is
    # not known here (Drive, URL, local path) fall through to the summary.
    # NOTE(review): assumes `len(inline_data)` reflects the payload size —
    # confirm the shape AI Studio sends for `inline_data`.
    embeddable = bool(inline_data) and len(inline_data) < 2**12

    if mime_type.startswith("audio/") and embeddable:
        audio = IPython.display.Audio(**kwargs)
        IPython.display.display(audio)
        print()
        return

    if mime_type.startswith("video/") and embeddable:
        video = IPython.display.Video(**kwargs, mimetype=mime_type)
        IPython.display.display(video)
        print()
        return

    print(f"File:\n    name: {name}\n    mime_type: {mime_type}\n")


# Replay the conversation exactly as AI Studio sent it, one message at a time.
for content in gais_contents:
    role = content.get("role", None)
    if role:
        print("Role:", role, "\n")

    for part in content["parts"]:
        # A part is shown as text when it has non-empty text, otherwise as a file.
        if text := part.get("text", None):
            print(text, "\n")
            continue
        if file_data := part.get("file_data", None):
            show_file(file_data)

    # Visual separator between messages.
    print("-" * 80, "\n")

What object is this? Describe how it might be used 

Object:  




Description: This is a pipe organ. It is a large musical instrument that is used in churches, concert halls, and other large buildings. It is made up of a series of pipes that are arranged in different sizes and shapes. The pipes are played by pressing keys on a keyboard. When a key is pressed, air is forced through the pipe, which produces a sound. The sound of a pipe organ is very powerful and can be used to create a wide variety of music. 

Object:  




Description: This is a sundial. It is a device that uses the sun's position in the sky to tell the time. The sundial has a flat surface with a hole in the center. A metal rod is placed through the hole and is pointed at the North Star. The shadow of the rod falls on the flat surface and indicates the time. 

Object:  




Description:  

-------------------------------------------------------------------------------- 

