update workflow

This commit is contained in:
Sanju Sivalingam
2026-02-16 21:14:16 +05:30
parent 4848587f0c
commit 2312f8bece
2 changed files with 35 additions and 2 deletions

View File

@@ -3,7 +3,7 @@
"steps": [
{
"app": "com.google.android.apps.bard",
"goal": "Gemini app is now open. Find the text input field and type exactly: 'tell me more about droidclaw.ai' — then tap the send/submit button. Wait for the full response to load completely. Do NOT mark done until you can see the AI has generated a response with actual text content on screen.",
"goal": "Gemini app is now open. Find the text input field and type exactly: 'tell me more about droidclaw.ai' — then look for the send icon button which is located next to the 'fast' button at the bottom of the input area. Tap that send icon to submit the query. Do NOT press enter — you MUST tap the send icon. Wait for the full response to load completely. Do NOT mark done until you can see the AI has generated a response with actual text content on screen.",
"maxSteps": 10
},
{
@@ -12,7 +12,7 @@
},
{
"app": "com.whatsapp",
"goal": "WhatsApp is now open showing the chat list. Look for a contact or chat named 'vi' or 'Vi' in the visible chat list. If you can see it, tap on it to open that chat. If 'vi' is NOT visible in the chat list, tap the search icon (magnifying glass) at the top of the screen, then type 'vi' in the search field, then tap on the matching contact result to open that chat. Do NOT mark done until you are inside the chat conversation with Vi.",
"goal": "WhatsApp is now open showing the chat list. Look for a contact or chat named 'vi' or 'Vi' in the visible chat list. IMPORTANT: When you find the contact, tap on the contact NAME TEXT on the right side of the row — do NOT tap on the profile picture/image on the left side. If 'vi' is NOT visible in the chat list, tap the search icon (magnifying glass) at the top of the screen, then type 'vi' in the search field, then tap on the matching contact name text (not the profile image) to open that chat. Do NOT mark done until you are inside the chat conversation with Vi.",
"maxSteps": 10
},
{

33
test-ollama.ts Normal file
View File

@@ -0,0 +1,33 @@
import OpenAI from "openai";
import { readFileSync } from "fs";
// Smoke test: sends one screenshot to a local Ollama server through the
// OpenAI client and prints the model's description of it.
//
// Usage: run the script with an optional image path as the first argument;
// without one, the original hard-coded screenshot path is used.

// Client pointed at the local Ollama endpoint instead of the OpenAI API.
// NOTE(review): "ollama" looks like a placeholder key — confirm the local
// server does not validate it.
const client = new OpenAI({
  baseURL: "http://localhost:11434/v1",
  apiKey: "ollama",
});

const model = "gemma3:4b";

// First CLI argument overrides the default so the script is usable on
// machines other than the author's.
const imagePath =
  process.argv[2] ?? "/Users/sanju/Downloads/komoot iOS 33.png";

// The data URL must carry a MIME type; derive it from the file extension and
// fall back to PNG (the original behaviour) for unknown or missing extensions.
const mimeByExtension = new Map<string, string>([
  ["png", "image/png"],
  ["jpg", "image/jpeg"],
  ["jpeg", "image/jpeg"],
  ["webp", "image/webp"],
  ["gif", "image/gif"],
]);
const extension = imagePath
  .slice(imagePath.lastIndexOf(".") + 1)
  .toLowerCase();
const mimeType = mimeByExtension.get(extension) ?? "image/png";

// Read the whole image and inline it as base64 in the request.
const base64 = readFileSync(imagePath).toString("base64");

console.log(`sending image to ollama (${model})...\n`);

const response = await client.chat.completions.create({
  model,
  messages: [
    {
      role: "user",
      content: [
        {
          type: "text",
          text: "Describe what you see in this screenshot. What app is this? What are the key UI elements?",
        },
        {
          type: "image_url",
          image_url: { url: `data:${mimeType};base64,${base64}` },
        },
      ],
    },
  ],
});

console.log("model:", response.model);
console.log("tokens:", response.usage);
console.log("\n--- response ---\n");

// Guard the first choice explicitly: indexing an empty `choices` array would
// otherwise fail with an opaque "cannot read properties of undefined".
const firstChoice = response.choices[0];
if (firstChoice === undefined) {
  throw new Error("ollama returned no choices in the completion response");
}
console.log(firstChoice.message.content ?? "(no text content in response)");