screens/CameraView.js

import React, { useState, useEffect } from "react";
import { isEmpty } from "lodash";
import { Button, Text, View } from "react-native";
import { Camera } from "expo-camera";
import * as tf from "@tensorflow/tfjs";
import * as blazeface from "@tensorflow-models/blazeface";
import "@tensorflow/tfjs-react-native";
import * as Permissions from "expo-permissions";
import {
  cameraWithTensors,
  bundleResourceIO
} from "@tensorflow/tfjs-react-native";

// Helper functions
import { indexOfMax, sumOfArray } from "../helper/HelperFunction";
import styles from "../styles/style";

// Tensor Camera replaces Expo Camera
const TensorCamera = cameraWithTensors(Camera);

// Disable errors on client app
console.disableYellowBox = true;

export default function CameraView() {
  // Variables to make constant predictions on the input frame
  let requestAnimationFrameId = 0;
  let frameCount = 0;
  let makePredictionsEveryNFrames = 1;
  let queueSize = 0;

  const AUTORENDER = true;

  //Loading model from models folder
  const modelJSON = require("../model/model.json");
  const modelWeights = require("../model/group1-shard1of1.bin");

  // Camera view parameters
  const previewLeft = 40;
  const previewTop = 50;
  const previewWidth = 350;
  const previewHeight = 600;

  // Size of the Tensors
  // Fixed to 224,224,3 for input into custom model
  const tensorDims = { height: 224, width: 224, depth: 3 };

  // State
  const [hasPermission, setHasPermission] = useState(null);
  const [blazeFaceModel, setBlazeFaceModel] = useState(null);
  const [textureDimsState, setTextureDims] = useState();
  const [blazeFacePrediction, setBlazeFacePrediction] = useState();
  const [type, setType] = useState(Camera.Constants.Type.front);
  const [modelFaces, setModelFaces] = useState([]);
  const [isTFReady, setTFReady] = useState(false);
  const [loadedModel, setModelLoaded] = useState(null);
  const [modelPrediction, setModelPrediction] = useState();
  const [frameWorkReady, setFrameWorkReady] = useState(false);
  const [finalPrediction, setFinalPrediction] = useState();
  const [predictionReady, setPredictionReady] = useState(false);
  const [allPredictions, setAllPredictions] = useState({
    "0": [],
    "5": [],
    "10": []
  });

  useEffect(() => {
    if (!frameWorkReady) {
      (async () => {
        const { status } = await Camera.requestPermissionsAsync().catch(e =>
          console.log(e)
        );
        if (Platform.OS == "ios") {
          setTextureDims({ height: 1920, width: 1080 });
        } else {
          setTextureDims({ height: 1200, width: 1600 });
        }
        setHasPermission(status === "granted");
        await tf.ready().catch(e => console.log(e));
        setTFReady(true);
        setModelLoaded(await loadModel().catch(e => console.log(e)));
        setBlazeFaceModel(
          await loadBlazeFaceModel().catch(e => console.log(e))
        );
        setFrameWorkReady(true);
      })();
    }
  }, []);

  // Run unMount for cancelling animation if it is running to avoid leaks
  useEffect(() => {
    return () => {
      cancelAnimationFrame(requestAnimationFrameId);
    };
  }, [requestAnimationFrameId]);

  // Use the loaded model to make predictions
  // There are 3 classes that the model will be predicting
  // Class 0: Awareness levels of 0
  // Class 5: Awareness levels of 5
  // Class 10: Awareness levels of 10
  // Pick the prediction class with the highest value

  const getPrediction = async tensor => {
    if (!tensor) {
      console.log("Tensor not found!");
    }
    const bfModel = await blazeFaceModel;
    const returnTensors = true;
    const faces = await bfModel
      .estimateFaces(tensor, returnTensors)
      .catch(e => console.log(e));
    const scale = {
      height: styles.camera.height / tensorDims.height,
      width: styles.camera.width / tensorDims.width
    };

    // Faces is an array of objects
    if (!isEmpty(faces)) {
      setModelFaces({ faces });
      faces.map((face, i) => {
        const { topLeft, bottomRight } = face;
        // Boxes in cropAndResize require to be normalized
        const normTopLeft = topLeft.div(tensor.shape.slice(-3, -2));
        const normBottomRight = bottomRight.div(tensor.shape.slice(-3, -2));
        const width = Math.floor(
          bottomRight.dataSync()[0] - topLeft.dataSync()[0] * scale.width
        );
        const height = Math.floor(
          bottomRight.dataSync()[1] - topLeft.dataSync()[1] * scale.height
        );
        const boxes = tf
          .concat([normTopLeft.dataSync(), normBottomRight.dataSync()])
          .reshape([-1, 4]);
        const crop = tf.image.cropAndResize(
          tensor.reshape([1, 224, 224, 3]),
          boxes,
          [0],
          [height, width]
        );
        // Resize cropped faces to [1,224,224,3]
        const alignCorners = true;
        const imageResize = tf.image.resizeBilinear(
          crop,
          [224, 224],
          alignCorners
        );
        makePrediction(imageResize);
      });
    }
  };
  const makePrediction = async image => {
    if (!image) {
      console.log("No input!");
    }
    const model = await loadedModel;
    const prediction = await model.predict(image, { batchSize: 1 });
    if (!prediction || isEmpty(prediction)) {
      console.log("Prediction not available");
    }
    rollingPrediction(prediction.dataSync());
  };

  // Handling the camera input and converting it into tensors to be used in the
  // model for predictions
  const handleCameraStream = imageAsTensors => {
    if (!imageAsTensors) {
      console.log("Image not found!");
    }
    const loop = async () => {
      if (frameCount % makePredictionsEveryNFrames === 0) {
        const imageTensor = imageAsTensors.next().value;

        if (loadedModel !== null && blazeFaceModel !== null) {
          await getPrediction(imageTensor).catch(e => console.log(e));
        }
        tf.dispose(imageAsTensors);
      }

      frameCount += 1;
      frameCount = frameCount % makePredictionsEveryNFrames;
      requestAnimationFrameId = requestAnimationFrame(loop);
    };
    //loop infinitely to constantly make predictions
    loop();
  };

  // Get the argMax at each frame
  // Store the class
  // Keep a count of each class and its resulting probability
  // Once the total count of the classes object reaches K
  // Select the argMax of the classes object
  // Probability of that class is the sum of all probability for argMax class divided by the len(total probability of argMax class)
  // That is the prediction
  // Set the state to be empty

  const rollingPrediction = arr => {
    const { max, maxIndex } = indexOfMax(arr);
    const maxFixed = parseFloat(max.toFixed(2));
    if (maxIndex === 0) {
      allPredictions["0"].push(maxFixed);
      queueSize += 1;
    } else if (maxIndex === 1) {
      allPredictions["10"].push(maxFixed);
      queueSize += 1;
    } else if (maxIndex === 2) {
      allPredictions["5"].push(maxFixed);
      queueSize += 1;
    }
    if (queueSize > 9) {
      console.log("Queue Size Max");
      const arr1 = allPredictions["0"].length;
      const arr2 = allPredictions["5"].length;
      const arr3 = allPredictions["10"].length;

      console.log(allPredictions);
      if (arr1 > arr2 && arr1 > arr3) {
        const sum = sumOfArray(allPredictions["0"]);
        const prob = sum / arr1;
        setFinalPrediction({ probability: prob, awarenessLevel: 0 });
        setPredictionReady(true);
      } else if (arr2 > arr1 && arr2 > arr3) {
        const sum = sumOfArray(allPredictions["5"]);
        const prob = sum / arr2;
        setFinalPrediction({ probability: prob, awarenessLevel: 5 });
        setPredictionReady(true);
      } else if (arr3 > arr2 && arr3 > arr1) {
        const sum = sumOfArray(allPredictions["10"]);
        const prob = sum / arr3;
        setFinalPrediction({ probability: prob, awarenessLevel: 10 });
        setPredictionReady(true);
      } else {
        console.log("No Rolling Prediction");
      }
      queueSize = 0;
      allPredictions["0"] = [];
      allPredictions["5"] = [];
      allPredictions["10"] = [];
    }
  };
  const predictionAvailable = () => {
    const { probability, awarenessLevel } = finalPrediction;
    return (
      <Text style={styles.awarenessText}>
        Awareness Level :{awarenessLevel} Probability :{probability.toFixed(2)}
      </Text>
    );
  };

  const noPrediction = () => {
    return <Text style={styles.awarenessText}>No prediction available</Text>;
  };

  const renderBoundingBoxes = () => {
    const { faces } = modelFaces;
    const scale = {
      height: styles.camera.height / tensorDims.height,
      width: styles.camera.width / tensorDims.width
    };
    const flipHorizontal = Platform.OS === "ios" ? false : true;
    if (!isEmpty(faces)) {
      return faces.map((face, i) => {
        const { topLeft, bottomRight } = face;
        const bbLeft = topLeft.dataSync()[0] * scale.width;
        const boxStyle = Object.assign({}, styles.bbox, {
          left: flipHorizontal
            ? previewWidth - bbLeft - previewLeft
            : bbLeft + previewLeft,
          top: topLeft.dataSync()[1] * scale.height + 20,
          width:
            (bottomRight.dataSync()[0] - topLeft.dataSync()[0]) * scale.width,
          height:
            (bottomRight.dataSync()[1] - topLeft.dataSync()[1]) * scale.height
        });
        return <View style={boxStyle} key={`faces${i}}`}></View>;
      });
    }
  };

  const renderFacesDebugInfo = () => {
    const { faces } = modelFaces;
    if (!isEmpty(faces)) {
      return faces.map((face, i) => {
        const { topLeft, bottomRight, probability } = face;

        return (
          <Text style={styles.faceDebug} key={`faceInfo${i}`}>
            Probability of being a face: {probability.dataSync()[0].toFixed(3)}{" "}
            | Top Left: [{topLeft.dataSync()[0].toFixed(1)},{" "}
            {topLeft.dataSync()[1].toFixed(1)}] | Bottom Right: [
            {bottomRight.dataSync()[0].toFixed(1)},{" "}
            {bottomRight.dataSync()[1].toFixed(1)}]
          </Text>
        );
      });
    }
  };

  // Load the Blaze Face model to detect the faces in the video

  const loadBlazeFaceModel = async () => {
    const model = await blazeface.load().catch(e => console.log(e));
    console.log("Loaded Blaze Face Model");
    return model;
  };

  // Load the model from the models folder
  const loadModel = async () => {
    const model = await tf
      .loadLayersModel(bundleResourceIO(modelJSON, modelWeights))
      .catch(e => console.log(e));
    console.log("Model loaded!");
    return model;
  };

  if (hasPermission === null) {
    return <View />;
  }
  if (hasPermission === false) {
    return <Text>No access to camera</Text>;
  }

  return (
    <View>
      <View style={styles.cameraContainer}>
        <TensorCamera
          style={styles.camera}
          type={type}
          zoom={0}
          cameraTextureHeight={textureDimsState.height}
          cameraTextureWidth={textureDimsState.width}
          resizeHeight={tensorDims.height}
          resizeWidth={tensorDims.width}
          resizeDepth={tensorDims.depth}
          onReady={imageAsTensors => handleCameraStream(imageAsTensors)}
          autorender={AUTORENDER}
        />
      </View>
      <View>{renderFacesDebugInfo()}</View>
      <View>
        {predictionReady && finalPrediction
          ? predictionAvailable()
          : noPrediction()}
      </View>
      <View style={styles.buttonContainer2}>
        <Button title="Start!" color="green" />
      </View>
    </View>
  );
}