oongaboongahacker
/

Gemini-Nano

Model card Files Files and versions Community

oongaboongahacker

adarshxs commited on Jun 25, 2024

Commit

18258c6

verified ·

1 Parent(s): dd97e5b

Update README.md (#1)

Browse files

- Update README.md (aea9014d3abc793def5bb2a9f53296ca531ad7c1)

Co-authored-by: Adarsh AS <[email protected]>

Files changed (1) hide show

README.md +122 -1

README.md CHANGED Viewed

@@ -13,9 +13,130 @@ The model seems to be of the TFLite model format with the following architecture
 ## Run the model using Mediapipe:
-Follow the instructions here: https://github.com/google-ai-edge/mediapipe-samples/tree/main/examples/llm_inference/js
 ## License
 I dont own shit. Just extracted the model weights stored as a .bin file. https://policies.google.com/terms/generative-ai/use-policy

 ## Run the model using Mediapipe:
+Instructions from here: https://github.com/google-ai-edge/mediapipe-samples/tree/main/examples/llm_inference/js
+In a directory, make two files:
+`index.html`:
+```html
+<!-- Copyright 2024 The MediaPipe Authors.
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+     http://www.apache.org/licenses/LICENSE-2.0
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License. -->
+<!doctype html>
+<html lang="en">
+<head>
+    <title>LLM Inference Web Demo</title>
+</head>
+<body>
+    Input:<br />
+    <textarea id="input" style="height: 300px; width: 600px"></textarea><br />
+    <input type="button" id="submit" value="Get Response" disabled /><br />
+    <br />
+    Result:<br />
+    <textarea id="output" style="height: 300px; width: 600px"></textarea>
+    <script type="module" src="index.js"></script>
+</body>
+</html>
+```
+`index.js`(Replace line no. 23 to the path to the .bin file):
+```js
+// Copyright 2024 The MediaPipe Authors.
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//      http://www.apache.org/licenses/LICENSE-2.0
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+// ---------------------------------------------------------------------------------------- //
+import {FilesetResolver, LlmInference} from 'https://cdn.jsdelivr.net/npm/@mediapipe/tasks-genai';
+const input = document.getElementById('input');
+const output = document.getElementById('output');
+const submit = document.getElementById('submit');
+const modelFileName = 'weights.bin'; /* PATH TO MODEL .bin */
+/**
+ * Display newly generated partial results to the output text box.
+ */
+function displayPartialResults(partialResults, complete) {
+  output.textContent += partialResults;
+  if (complete) {
+    if (!output.textContent) {
+      output.textContent = 'Result is empty';
+    }
+    submit.disabled = false;
+  }
+}
+/**
+ * Main function to run LLM Inference.
+ */
+async function runDemo() {
+  const genaiFileset = await FilesetResolver.forGenAiTasks(
+      'https://cdn.jsdelivr.net/npm/@mediapipe/tasks-genai/wasm');
+  let llmInference;
+  submit.onclick = () => {
+    output.textContent = '';
+    submit.disabled = true;
+    llmInference.generateResponse(input.value, displayPartialResults);
+  };
+  submit.value = 'Loading the model...'
+  LlmInference
+      .createFromOptions(genaiFileset, {
+        baseOptions: {modelAssetPath: modelFileName},
+        // maxTokens: 512,  // The maximum number of tokens (input tokens + output
+        //                  // tokens) the model handles.
+        // randomSeed: 1,   // The random seed used during text generation.
+        // topK: 1,  // The number of tokens the model considers at each step of
+        //           // generation. Limits predictions to the top k most-probable
+        //           // tokens. Setting randomSeed is required for this to make
+        //           // effects.
+        // temperature:
+        //     1.0,  // The amount of randomness introduced during generation.
+        //           // Setting randomSeed is required for this to make effects.
+      })
+      .then(llm => {
+        llmInference = llm;
+        submit.disabled = false;
+        submit.value = 'Get Response'
+      })
+      .catch(() => {
+        alert('Failed to initialize the task.');
+      });
+}
+runDemo();
+```
+## Run using:
+`python3 -m http.server 8000` in the same directory (or python -m SimpleHTTPServer 8000 for older python versions).
+Finally,
+`Open localhost:8000 in Chrome`
 ## License
 I dont own shit. Just extracted the model weights stored as a .bin file. https://policies.google.com/terms/generative-ai/use-policy