model generation test box takes input prompt from voice transcription box

transcribe voice to text with Whisper base model
install whisper.unity package
2025-12-15 15:57:32 +02:00 · 2025-12-15 15:30:15 +02:00 · 2025-12-15 13:57:07 +02:00 · 2025-12-05 16:58:07 +02:00 · 2025-12-01 17:19:31 +02:00 · 2025-12-01 17:06:42 +02:00
62 changed files with 1655 additions and 111 deletions
--- a/3d-generation-pipeline/.env.example
+++ b/3d-generation-pipeline/.env.example
@@ -0,0 +1,5 @@
+3D_GENERATION_URL=
+MODEL_FOLDER=
+
+CLOUDFLARE_ACCOUNT_ID=
+CLOUDFLARE_API_TOKEN=
--- a/3d-generation-pipeline/.gitignore
+++ b/3d-generation-pipeline/.gitignore
@@ -0,0 +1,7 @@
+.venv
+.env
+__pycache__
+images/
+models/
+logs/
+notebooks/test_resources/
--- a/3d-generation-pipeline/README.md
+++ b/3d-generation-pipeline/README.md
@@ -0,0 +1,6 @@
+### TODO
+* Article on text-to-3D prompt engineering: "Sel3DCraft: Interactive Visual Prompts for User-Friendly Text-to-3D Generation"
+* TRELLIS: postprocessing_utils: texture baking mode: 'opt' vs 'fast' - currently hardcoded to 'opt'; enabling 'fast' raises an error
+
+### Notes
+* TRELLIS: added the ability to pass the total number of texture baking optimisation steps as an argument (`texture_opt_total_steps`), replacing the hardcoded 2500. This change is not tracked in Git, because it was made directly in this release: https://github.com/IgorAherne/trellis-stable-projectorz/releases/tag/latest
--- a/3d-generation-pipeline/cloudflare_api.py
+++ b/3d-generation-pipeline/cloudflare_api.py
@@ -0,0 +1,61 @@
+import base64
+import requests
+import os
+
+from dotenv import load_dotenv
+
+# Load variables from a local .env file into the process environment.
+load_dotenv()
+# Cloudflare credentials used by both API helpers below; indexing os.environ
+# raises KeyError at import time if either variable is unset.
+ACCOUNT_ID = os.environ["CLOUDFLARE_ACCOUNT_ID"]
+API_TOKEN = os.environ["CLOUDFLARE_API_TOKEN"]
+
+def text_to_image_cloudflare(prompt, output_path):
+    """Generate an image for ``prompt`` via Cloudflare Workers AI and save it.
+
+    Posts the prompt to the flux-1-schnell model, decodes the base64 image
+    found under ``result.image`` in the JSON response and writes the bytes
+    to ``output_path``.
+
+    Args:
+        prompt: Text description of the image to generate.
+        output_path: Destination file path for the decoded image bytes.
+
+    Returns:
+        True once the image has been written.
+
+    Raises:
+        requests.HTTPError: If the API answers with an error status.
+        RuntimeError: If the response JSON carries no image payload.
+    """
+    MODEL = "@cf/black-forest-labs/flux-1-schnell"
+    URL = f"https://api.cloudflare.com/client/v4/accounts/{ACCOUNT_ID}/ai/run/{MODEL}"
+
+    payload = {
+        "prompt": prompt,
+    }
+
+    headers = {
+        "Authorization": f"Bearer {API_TOKEN}",
+        "Content-Type": "application/json",
+    }
+
+    resp = requests.post(URL, json=payload, headers=headers, timeout=60)
+    resp.raise_for_status()
+
+    data = resp.json()
+    # Look the payload up defensively so a missing or null "result"/"image"
+    # reaches the RuntimeError below instead of escaping as KeyError/TypeError.
+    result = data.get("result") if isinstance(data, dict) else None
+    b64 = result.get("image") if isinstance(result, dict) else None
+    if not b64:
+        raise RuntimeError(f"Unexpected response structure: {data}")
+
+    img_bytes = base64.b64decode(b64)
+
+    with open(output_path, "wb") as f:
+        f.write(img_bytes)
+
+    return True
+
+
+def refine_text_prompt(prompt):
+    """Condense a spoken-style user request into a short object description.
+
+    Sends ``prompt`` as the user message, together with a fixed system
+    instruction, to the llama-3.2-3b-instruct model on Cloudflare Workers AI.
+
+    Args:
+        prompt: The raw user text describing the desired object.
+
+    Returns:
+        The model's reply, read from ``result.response`` in the JSON body.
+
+    Raises:
+        requests.HTTPError: If the API answers with an error status.
+        KeyError: If the response JSON lacks ``result.response``.
+    """
+    MODEL = "@cf/meta/llama-3.2-3b-instruct"
+    URL = f"https://api.cloudflare.com/client/v4/accounts/{ACCOUNT_ID}/ai/run/{MODEL}"
+
+    instructions = """
+    User is talking about some object. Your task is to generate a short and concise description of it. Use only user's own words, keep it as short as possible.
+    Example:
+    User: 'Umm, okay, I would like a really cool sword, with for example a bright orange crossguard. And also it should be slightly curved.'
+    You: 'a slightly curved sword with bright orange crossguard'
+    """
+
+    # Same timeout as text_to_image_cloudflare, so a stalled request cannot
+    # block the caller indefinitely.
+    response = requests.post(
+        URL,
+        headers={"Authorization": f"Bearer {API_TOKEN}"},
+        json={
+            "messages": [
+                {"role": "system", "content": instructions},
+                {"role": "user", "content": prompt},
+            ]
+        },
+        timeout=60,
+    )
+    # Surface HTTP failures directly rather than as a KeyError on the body.
+    response.raise_for_status()
+    data = response.json()
+    return data["result"]["response"]
--- a/3d-generation-pipeline/generate_image_local.py
+++ b/3d-generation-pipeline/generate_image_local.py
@@ -0,0 +1,86 @@
+import requests
+
+from invokeai_mcp_server import create_text2img_graph, enqueue_graph, wait_for_completion, get_image_url
+from urllib.parse import urljoin
+
+
+# Base URL of the InvokeAI server; generate_image joins the image URL onto it.
+INVOKEAI_BASE_URL = "http://127.0.0.1:9090"
+
+
+async def generate_image(arguments: dict):
+    """Run a text-to-image job on InvokeAI and return the image's full URL.
+
+    Builds a text2img graph from ``arguments``, enqueues it, waits for the
+    batch to complete and resolves the first ``image_output`` node to a URL
+    joined onto ``INVOKEAI_BASE_URL``.
+
+    Args:
+        arguments: Generation settings. ``prompt`` is required; the other
+            keys read here are optional and fall back to the defaults below.
+
+    Returns:
+        URL of the generated image.
+
+    Raises:
+        KeyError: If ``arguments`` has no ``prompt``.
+        RuntimeError: If the completed batch contains no image output.
+    """
+    prompt = arguments["prompt"]
+    graph_settings = {
+        "prompt": prompt,
+        "negative_prompt": arguments.get("negative_prompt", ""),
+        "model_key": arguments.get("model_key"),
+        "lora_key": arguments.get("lora_key"),
+        "lora_weight": arguments.get("lora_weight", 1.0),
+        "vae_key": arguments.get("vae_key"),
+        "width": arguments.get("width", 512),
+        "height": arguments.get("height", 512),
+        "steps": arguments.get("steps", 30),
+        "cfg_scale": arguments.get("cfg_scale", 7.5),
+        "scheduler": arguments.get("scheduler", "euler"),
+        "seed": arguments.get("seed"),
+    }
+
+    print(f"Generating image with prompt: {prompt[:50]}...")
+
+    graph = await create_text2img_graph(**graph_settings)
+
+    # Queue the graph and block until its batch has finished
+    enqueued = await enqueue_graph(graph)
+    batch_id = enqueued["batch"]["batch_id"]
+
+    print(f"Enqueued batch {batch_id}, waiting for completion...")
+
+    completed = await wait_for_completion(batch_id)
+
+    has_outputs = "result" in completed and "outputs" in completed["result"]
+    if not has_outputs:
+        raise RuntimeError("Failed to generate image!")
+
+    # The first node that produced an image wins
+    for output in completed["result"]["outputs"].values():
+        if output.get("type") != "image_output":
+            continue
+        image_url = await get_image_url(output["image"]["image_name"])
+        return urljoin(INVOKEAI_BASE_URL, image_url)
+
+    raise RuntimeError("Failed to generate image!")
+
+def download_file(url, filepath):
+    """Download ``url`` and write the response body to ``filepath``.
+
+    Args:
+        url: Address of the file to fetch.
+        filepath: Destination path; missing parent folders are created.
+
+    Raises:
+        RuntimeError: If the server answers with a status other than 200.
+        requests.RequestException: If the request fails or times out.
+    """
+    # Imported locally because this module does not import pathlib itself.
+    from pathlib import Path
+
+    # A timeout keeps a stalled server from blocking the pipeline forever.
+    response = requests.get(url, timeout=60)
+
+    if response.status_code != 200:
+        raise RuntimeError(f"Failed to download image. Status code: {response.status_code}")
+
+    # Create the target folder on demand so the write does not fail with
+    # FileNotFoundError when it has not been created yet.
+    target = Path(filepath)
+    target.parent.mkdir(parents=True, exist_ok=True)
+    target.write_bytes(response.content)
+
+
+async def text_to_image_invoke_ai(prompt, output_path):
+    """Generate a 512x512 image for ``prompt`` with InvokeAI and save it.
+
+    Args:
+        prompt: Text description of the image to generate.
+        output_path: Destination file path for the downloaded image.
+    """
+    # see available model keys via GET http://127.0.0.1:9090/api/v2/models/?model_type=main
+    model_key = "79401292-0a6b-428d-b7d7-f1e86caeba2b"  # Juggernaut XL v9
+    # Alternative model: "735f6485-6703-498f-929e-07cf0bbbd179" (Dreamshaper 8)
+    image_url = await generate_image(
+        {"prompt": prompt, "width": 512, "height": 512, "model_key": model_key}
+    )
+    print("got image url: ", image_url)
+    download_file(image_url, output_path)
--- a/3d-generation-pipeline/generate_model_local.py
+++ b/3d-generation-pipeline/generate_model_local.py
@@ -0,0 +1,97 @@
+import subprocess
+import os
+import time
+import requests
+import base64
+
+from dotenv import load_dotenv
+
+# Load variables from a local .env file, then read the two required settings;
+# indexing os.environ raises KeyError at import time if either is unset.
+load_dotenv()
+# Folder whose .venv interpreter and run.py are launched by image_to_3d_subprocess.
+MODEL_FOLDER = os.environ["MODEL_FOLDER"]
+# Base URL of the 3D generation API called by generate_no_preview.
+# NOTE(review): the variable name starts with a digit, which POSIX shells do
+# not accept in `export`, so it presumably has to come from .env - confirm.
+API_URL = os.environ["3D_GENERATION_URL"]
+
+
+def image_to_3d_subprocess(image_path, output_path):
+    """Run the model folder's ``run.py`` on an image in its own virtualenv.
+
+    Launches ``MODEL_FOLDER\.venv\Scripts\python.exe`` with ``run.py``, the
+    image path and ``--output-dir``, then prints the captured stdout, stderr
+    and return code. Any exception is printed rather than raised, and the
+    function always returns None.
+
+    Args:
+        image_path: Path of the input image passed to ``run.py``.
+        output_path: Value passed to ``run.py`` as ``--output-dir``.
+    """
+    command = [
+        MODEL_FOLDER + r"\.venv\Scripts\python.exe",
+        MODEL_FOLDER + r"\run.py",
+        image_path,
+        "--output-dir",
+        output_path,
+    ]
+
+    try:
+        result = subprocess.run(command, capture_output=True, text=True)
+
+        # Report everything the child process produced
+        report = (
+            ("STDOUT:\n", result.stdout),
+            ("STDERR:\n", result.stderr),
+            ("Return Code:", result.returncode),
+        )
+        for label, value in report:
+            print(label, value)
+
+    except Exception as e:
+        print(f"Error occurred: {e}")
+
+
+
+def generate_no_preview(image_base64: str):
+    """Request a 3D model for one base64-encoded image and return its bytes.
+
+    Posts the image with fixed generation settings to the generation API,
+    polls the status endpoint once per second until it reports COMPLETE,
+    then downloads the model.
+
+    Args:
+        image_base64: Base64 string of the image (without 'data:image/...' prefix)
+
+    Returns:
+        The downloaded model content, or None if any step raised; the error
+        is printed instead of being propagated.
+    """
+    try:
+        # Fixed generation settings sent as form fields
+        params = dict(
+            image_base64=image_base64,
+            seed=42,
+            ss_guidance_strength=7.5,
+            ss_sampling_steps=10,
+            slat_guidance_strength=7.5,
+            slat_sampling_steps=10,
+            mesh_simplify_ratio=0.99,
+            texture_size=1024,
+            # texture_baking_mode='opt' is intentionally not sent
+            texture_opt_total_steps=1000,
+            output_format='glb',
+        )
+
+        print("Starting generation...")
+        requests.post(f"{API_URL}/generate_no_preview", data=params).raise_for_status()
+
+        # Poll once per second until the job reports a terminal state
+        while True:
+            status = requests.get(f"{API_URL}/status").json()
+            print(f"Progress: {status['progress']}%")
+
+            state = status['status']
+            if state == 'FAILED':
+                raise Exception(f"Generation failed: {status['message']}")
+            if state == 'COMPLETE':
+                break
+
+            time.sleep(1)
+
+        print("Downloading model...")
+        download = requests.get(f"{API_URL}/download/model")
+        download.raise_for_status()
+        return download.content
+
+    except Exception as e:
+        print(f"Error: {str(e)}")
+        return None
+    
+def image_to_3d_api(image_path, output_path):
+    """Convert an image file to a GLB model via the 3D generation API.
+
+    Reads the image, base64-encodes it, requests a model through
+    ``generate_no_preview`` and writes the result to ``<output_path>.glb``.
+
+    Args:
+        image_path: Path of the input image file.
+        output_path: Output path without extension; ``.glb`` is appended.
+
+    Returns:
+        The path of the written model file, as a string.
+
+    Raises:
+        RuntimeError: If model generation failed and returned no data.
+    """
+    with open(image_path, 'rb') as image_file:
+        image_data = image_file.read()
+
+    base64_encoded = base64.b64encode(image_data).decode('utf-8')
+    model_binary = generate_no_preview(base64_encoded)
+    # generate_no_preview reports failure by returning None. Stop here so we
+    # neither hit a TypeError in write() nor leave an empty .glb file behind.
+    if model_binary is None:
+        raise RuntimeError("3D model generation failed; no model data to save")
+
+    output_file = f"{output_path}.glb"
+    with open(output_file, 'wb') as f:
+        f.write(model_binary)
+
+    return output_file
+    
--- a/3d-generation-pipeline/notebooks/cloudflare_API_test.ipynb
+++ b/3d-generation-pipeline/notebooks/cloudflare_API_test.ipynb
@@ -0,0 +1,153 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "1dc6faae",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import os\n",
+    "import base64\n",
+    "import requests\n",
+    "from dotenv import load_dotenv"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "b3107275",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "load_dotenv()\n",
+    "\n",
+    "ACCOUNT_ID = os.environ[\"CLOUDFLARE_ACCOUNT_ID\"]\n",
+    "API_TOKEN = os.environ[\"CLOUDFLARE_API_TOKEN\"]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "999adf95",
+   "metadata": {},
+   "source": [
+    "## Text to image"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "40b35163",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Saved: test_resources/resolution_test_1.jpg  (315728 bytes)\n"
+     ]
+    }
+   ],
+   "source": [
+    "# https://developers.cloudflare.com/workers-ai/models/flux-1-schnell/\n",
+    "\n",
+    "MODEL = \"@cf/black-forest-labs/flux-1-schnell\"\n",
+    "URL = f\"https://api.cloudflare.com/client/v4/accounts/{ACCOUNT_ID}/ai/run/{MODEL}\"\n",
+    "\n",
+    "payload = {\n",
+    "    \"prompt\": \"cyborg crocodile, realistic style, single object, front and side fully visible, plain neutral background, clear details, soft studio lighting, true-to-scale\",\n",
+    "}\n",
+    "\n",
+    "headers = {\n",
+    "    \"Authorization\": f\"Bearer {API_TOKEN}\",\n",
+    "    \"Content-Type\": \"application/json\",\n",
+    "}\n",
+    "\n",
+    "resp = requests.post(URL, json=payload, headers=headers, timeout=60)\n",
+    "resp.raise_for_status()\n",
+    "\n",
+    "data = resp.json()\n",
+    "b64 = data[\"result\"][\"image\"]\n",
+    "if not b64:\n",
+    "    raise RuntimeError(f\"Unexpected response structure: {data}\")\n",
+    "\n",
+    "img_bytes = base64.b64decode(b64)\n",
+    "\n",
+    "out_path = \"test_resources/resolution_test_1.jpg\"\n",
+    "with open(out_path, \"wb\") as f:\n",
+    "    f.write(img_bytes)\n",
+    "\n",
+    "print(f\"Saved: {out_path}  ({len(img_bytes)} bytes)\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "14a874c4",
+   "metadata": {},
+   "source": [
+    "## Text prompt refinement"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 13,
+   "id": "485f6f46",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\"dark wooden battleaxe with bronze blade\"\n"
+     ]
+    }
+   ],
+   "source": [
+    "MODEL = \"@cf/meta/llama-3.2-3b-instruct\"\n",
+    "URL = f\"https://api.cloudflare.com/client/v4/accounts/{ACCOUNT_ID}/ai/run/{MODEL}\"\n",
+    "\n",
+    "instructions = \"\"\"\n",
+    "User is talking about some object. Your task is to generate a short and concise description of it. Use only user's own words, keep it as short as possible.\n",
+    "Example:\n",
+    "User: 'Umm, okay, I would like a really cool sword, with for example a bright orange crossguard. And also it should be slightly curved.'\n",
+    "You: 'a slightly curved sword with bright orange crossguard'\n",
+    "\"\"\"\n",
+    "prompt = \"Umm, alright, can you please give me an epic battleaxe? It should have a dark wooden shaft and bronze blade.\"\n",
+    "\n",
+    "response = requests.post(URL,\n",
+    "  headers={\"Authorization\": f\"Bearer {API_TOKEN}\"},\n",
+    "  json={\n",
+    "    \"messages\": [\n",
+    "      {\"role\": \"system\", \"content\": instructions},\n",
+    "      {\"role\": \"user\", \"content\": prompt}\n",
+    "    ]\n",
+    "  }\n",
+    ")\n",
+    "data = response.json()\n",
+    "result_text = data[\"result\"][\"response\"]\n",
+    "print(result_text)"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": ".venv",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.10.11"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
--- a/3d-generation-pipeline/notebooks/local_image_generation.ipynb
+++ b/3d-generation-pipeline/notebooks/local_image_generation.ipynb
@@ -0,0 +1,122 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "50e24baa",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from invokeai_mcp_server import create_text2img_graph, enqueue_graph, wait_for_completion, get_image_url\n",
+    "from urllib.parse import urljoin\n",
+    "\n",
+    "import asyncio"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "0407cd9a",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "INVOKEAI_BASE_URL = \"http://127.0.0.1:9090\"\n",
+    "\n",
+    "\n",
+    "async def generate_image(arguments: dict):\n",
+    "\n",
+    "    # Extract parameters\n",
+    "    prompt = arguments[\"prompt\"]\n",
+    "    negative_prompt = arguments.get(\"negative_prompt\", \"\")\n",
+    "    width = arguments.get(\"width\", 512)\n",
+    "    height = arguments.get(\"height\", 512)\n",
+    "    steps = arguments.get(\"steps\", 30)\n",
+    "    cfg_scale = arguments.get(\"cfg_scale\", 7.5)\n",
+    "    scheduler = arguments.get(\"scheduler\", \"euler\")\n",
+    "    seed = arguments.get(\"seed\")\n",
+    "    model_key = arguments.get(\"model_key\")\n",
+    "    lora_key = arguments.get(\"lora_key\")\n",
+    "    lora_weight = arguments.get(\"lora_weight\", 1.0)\n",
+    "    vae_key = arguments.get(\"vae_key\")\n",
+    "\n",
+    "    #logger.info(f\"Generating image with prompt: {prompt[:50]}...\")\n",
+    "\n",
+    "    # Create graph\n",
+    "    graph = await create_text2img_graph(\n",
+    "        prompt=prompt,\n",
+    "        negative_prompt=negative_prompt,\n",
+    "        model_key=model_key,\n",
+    "        lora_key=lora_key,\n",
+    "        lora_weight=lora_weight,\n",
+    "        vae_key=vae_key,\n",
+    "        width=width,\n",
+    "        height=height,\n",
+    "        steps=steps,\n",
+    "        cfg_scale=cfg_scale,\n",
+    "        scheduler=scheduler,\n",
+    "        seed=seed\n",
+    "    )\n",
+    "\n",
+    "    # Enqueue and wait for completion\n",
+    "    result = await enqueue_graph(graph)\n",
+    "    batch_id = result[\"batch\"][\"batch_id\"]\n",
+    "\n",
+    "    #logger.info(f\"Enqueued batch {batch_id}, waiting for completion...\")\n",
+    "\n",
+    "    completed = await wait_for_completion(batch_id)\n",
+    "\n",
+    "    # Extract image name from result\n",
+    "    if \"result\" in completed and \"outputs\" in completed[\"result\"]:\n",
+    "        outputs = completed[\"result\"][\"outputs\"]\n",
+    "        # Find the image output\n",
+    "        for node_id, output in outputs.items():\n",
+    "            if output.get(\"type\") == \"image_output\":\n",
+    "                image_name = output[\"image\"][\"image_name\"]\n",
+    "                image_url = await get_image_url(image_name)\n",
+    "\n",
+    "                text=f\"Image generated successfully!\\n\\nImage Name: {image_name}\\nImage URL: {image_url}\\n\\nYou can view the image at: {urljoin(INVOKEAI_BASE_URL, f'/api/v1/images/i/{image_name}/full')}\"\n",
+    "                print(text)\n",
+    "\n",
+    "    # Fallback if we couldn't find image output\n",
+    "    #text=f\"Image generation completed but output format was unexpected. Batch ID: {batch_id}\\n\\nResult: {json.dumps(completed, indent=2)}\""
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "6cf9d879",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "async def main():\n",
+    "    args = {\n",
+    "        \"prompt\": \"a golden katana with a fancy pommel\"\n",
+    "    }\n",
+    "    await generate_image(args)\n",
+    "\n",
+    "asyncio.run(main())"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": ".venv",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.10.11"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
--- a/3d-generation-pipeline/notebooks/local_model_generation_test.ipynb
+++ b/3d-generation-pipeline/notebooks/local_model_generation_test.ipynb
@@ -0,0 +1,152 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "d55eb3ce",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import requests\n",
+    "import base64\n",
+    "import time"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "id": "77b23cd8",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# API endpoint\n",
+    "BASE_URL = \"http://127.0.0.1:7960\"\n",
+    "\n",
+    "def generate_no_preview(image_base64: str):\n",
+    "    \"\"\"Generate 3D model from a single base64-encoded image without previews.\n",
+    "    \n",
+    "    Args:\n",
+    "        image_base64: Base64 string of the image (without 'data:image/...' prefix)\n",
+    "    \"\"\"\n",
+    "    try:\n",
+    "        # Set generation parameters\n",
+    "        params = {\n",
+    "            'image_base64': image_base64,\n",
+    "            'seed': 42,\n",
+    "            'ss_guidance_strength': 7.5,\n",
+    "            'ss_sampling_steps': 30,\n",
+    "            'slat_guidance_strength': 7.5,\n",
+    "            'slat_sampling_steps': 30,\n",
+    "            'mesh_simplify_ratio': 0.95,\n",
+    "            'texture_size': 1024,\n",
+    "            'output_format': 'glb'\n",
+    "        }\n",
+    "        \n",
+    "        # Start generation\n",
+    "        print(\"Starting generation...\")\n",
+    "        response = requests.post(f\"{BASE_URL}/generate_no_preview\", data=params)\n",
+    "        print(\"Response status:\", response.status_code)\n",
+    "        response.raise_for_status()\n",
+    "        \n",
+    "        # Poll status until complete\n",
+    "        while True:\n",
+    "            status = requests.get(f\"{BASE_URL}/status\").json()\n",
+    "            print(f\"Progress: {status['progress']}%\")\n",
+    "            \n",
+    "            if status['status'] == 'COMPLETE':\n",
+    "                break\n",
+    "            elif status['status'] == 'FAILED':\n",
+    "                raise Exception(f\"Generation failed: {status['message']}\")\n",
+    "            \n",
+    "            time.sleep(1)\n",
+    "        \n",
+    "        # Download the model\n",
+    "        print(\"Downloading model...\")\n",
+    "        response = requests.get(f\"{BASE_URL}/download/model\")\n",
+    "        response.raise_for_status()\n",
+    "        print(\"Model downloaded.\")\n",
+    "        \n",
+    "        return response.content\n",
+    "        \n",
+    "    except Exception as e:\n",
+    "        print(f\"Error: {str(e)}\")\n",
+    "        return None"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "eb122295",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def generate_model(image_path, output_path):\n",
+    "    with open(image_path, 'rb') as image_file:\n",
+    "        image_data = image_file.read()\n",
+    "\n",
+    "    base64_encoded = base64.b64encode(image_data).decode('utf-8')\n",
+    "    model = generate_no_preview(base64_encoded)\n",
+    "    \n",
+    "    with open(output_path, 'wb') as f:\n",
+    "        f.write(model)\n",
+    "    print(f\"Model saved to {output_path}\")\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "id": "2ce7dfdf",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Starting generation...\n",
+      "Response status: 200\n",
+      "Progress: 100%\n",
+      "Downloading model...\n",
+      "Model downloaded.\n",
+      "Model saved to test_resources/style_test_3_model.glb\n"
+     ]
+    }
+   ],
+   "source": [
+    "\n",
+    "image_path = 'test_resources/style_test_3.jpg'\n",
+    "output_path = \"test_resources/style_test_3_model.glb\"\n",
+    "\n",
+    "generate_model(image_path, output_path)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "a1224d13",
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": ".venv",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.10.11"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
--- a/3d-generation-pipeline/notebooks/subprocess_test.ipynb
+++ b/3d-generation-pipeline/notebooks/subprocess_test.ipynb
@@ -0,0 +1,165 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "4826c91d",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "'2025-10-18-16-35-47'"
+      ]
+     },
+     "execution_count": 1,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from datetime import datetime\n",
+    "\n",
+    "datetime.now().strftime(\"%Y-%m-%d-%H-%M-%S\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "id": "9419e692",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "STDOUT:\n",
+      " Device used:  cuda\n",
+      "After Remesh 9998 19996\n",
+      "\n",
+      "STDERR:\n",
+      " D:\\users\\henrisel\\stable-fast-3d\\.venv\\lib\\site-packages\\timm\\models\\layers\\__init__.py:48: FutureWarning: Importing from timm.models.layers is deprecated, please import via timm.layers\n",
+      "  warnings.warn(f\"Importing from {__name__} is deprecated, please import via timm.layers\", FutureWarning)\n",
+      "\n",
+      "  0%|          | 0/1 [00:00<?, ?it/s]\n",
+      "  0%|          | 0/1 [00:00<?, ?it/s]\n",
+      "Traceback (most recent call last):\n",
+      "  File \"D:\\users\\henrisel\\stable-fast-3d\\run.py\", line 122, in <module>\n",
+      "    mesh, glob_dict = model.run_image(\n",
+      "  File \"D:\\users\\henrisel\\stable-fast-3d\\sf3d\\system.py\", line 286, in run_image\n",
+      "    meshes, global_dict = self.generate_mesh(\n",
+      "  File \"D:\\users\\henrisel\\stable-fast-3d\\sf3d\\system.py\", line 369, in generate_mesh\n",
+      "    rast = self.baker.rasterize(\n",
+      "  File \"D:\\users\\henrisel\\stable-fast-3d\\.venv\\lib\\site-packages\\texture_baker\\baker.py\", line 28, in rasterize\n",
+      "    return torch.ops.texture_baker_cpp.rasterize(\n",
+      "  File \"D:\\users\\henrisel\\stable-fast-3d\\.venv\\lib\\site-packages\\torch\\_ops.py\", line 1243, in __call__\n",
+      "    return self._op(*args, **kwargs)\n",
+      "NotImplementedError: Could not run 'texture_baker_cpp::rasterize' with arguments from the 'CUDA' backend. This could be because the operator doesn't exist for this backend, or was omitted during the selective/custom build process (if using custom build). If you are a Facebook employee using PyTorch on mobile, please visit https://fburl.com/ptmfixes for possible resolutions. 'texture_baker_cpp::rasterize' is only available for these backends: [CPU, Meta, BackendSelect, Python, FuncTorchDynamicLayerBackMode, Functionalize, Named, Conjugate, Negative, ZeroTensor, ADInplaceOrView, AutogradOther, AutogradCPU, AutogradCUDA, AutogradXLA, AutogradMPS, AutogradXPU, AutogradHPU, AutogradLazy, AutogradMTIA, AutogradMAIA, AutogradMeta, Tracer, AutocastCPU, AutocastMTIA, AutocastMAIA, AutocastXPU, AutocastMPS, AutocastCUDA, FuncTorchBatched, BatchedNestedTensor, FuncTorchVmapMode, Batched, VmapMode, FuncTorchGradWrapper, PythonTLSSnapshot, FuncTorchDynamicLayerFrontMode, PreDispatch, PythonDispatcher].\n",
+      "\n",
+      "CPU: registered at texture_baker\\csrc\\baker.cpp:543 [kernel]\n",
+      "Meta: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\MetaFallbackKernel.cpp:23 [backend fallback]\n",
+      "BackendSelect: fallthrough registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\BackendSelectFallbackKernel.cpp:3 [backend fallback]\n",
+      "Python: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\PythonFallbackKernel.cpp:194 [backend fallback]\n",
+      "FuncTorchDynamicLayerBackMode: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\functorch\\DynamicLayer.cpp:479 [backend fallback]\n",
+      "Functionalize: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\FunctionalizeFallbackKernel.cpp:375 [backend fallback]\n",
+      "Named: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\NamedRegistrations.cpp:7 [backend fallback]\n",
+      "Conjugate: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\ConjugateFallback.cpp:17 [backend fallback]\n",
+      "Negative: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\native\\NegateFallback.cpp:18 [backend fallback]\n",
+      "ZeroTensor: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\ZeroTensorFallback.cpp:86 [backend fallback]\n",
+      "ADInplaceOrView: fallthrough registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\VariableFallbackKernel.cpp:104 [backend fallback]\n",
+      "AutogradOther: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\VariableFallbackKernel.cpp:63 [backend fallback]\n",
+      "AutogradCPU: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\VariableFallbackKernel.cpp:67 [backend fallback]\n",
+      "AutogradCUDA: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\VariableFallbackKernel.cpp:75 [backend fallback]\n",
+      "AutogradXLA: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\VariableFallbackKernel.cpp:87 [backend fallback]\n",
+      "AutogradMPS: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\VariableFallbackKernel.cpp:95 [backend fallback]\n",
+      "AutogradXPU: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\VariableFallbackKernel.cpp:71 [backend fallback]\n",
+      "AutogradHPU: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\VariableFallbackKernel.cpp:108 [backend fallback]\n",
+      "AutogradLazy: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\VariableFallbackKernel.cpp:91 [backend fallback]\n",
+      "AutogradMTIA: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\VariableFallbackKernel.cpp:79 [backend fallback]\n",
+      "AutogradMAIA: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\VariableFallbackKernel.cpp:83 [backend fallback]\n",
+      "AutogradMeta: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\VariableFallbackKernel.cpp:99 [backend fallback]\n",
+      "Tracer: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\torch\\csrc\\autograd\\TraceTypeManual.cpp:294 [backend fallback]\n",
+      "AutocastCPU: fallthrough registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\autocast_mode.cpp:322 [backend fallback]\n",
+      "AutocastMTIA: fallthrough registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\autocast_mode.cpp:466 [backend fallback]\n",
+      "AutocastMAIA: fallthrough registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\autocast_mode.cpp:504 [backend fallback]\n",
+      "AutocastXPU: fallthrough registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\autocast_mode.cpp:542 [backend fallback]\n",
+      "AutocastMPS: fallthrough registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\autocast_mode.cpp:209 [backend fallback]\n",
+      "AutocastCUDA: fallthrough registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\autocast_mode.cpp:165 [backend fallback]\n",
+      "FuncTorchBatched: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\functorch\\LegacyBatchingRegistrations.cpp:731 [backend fallback]\n",
+      "BatchedNestedTensor: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\functorch\\LegacyBatchingRegistrations.cpp:758 [backend fallback]\n",
+      "FuncTorchVmapMode: fallthrough registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\functorch\\VmapModeRegistrations.cpp:27 [backend fallback]\n",
+      "Batched: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\LegacyBatchingRegistrations.cpp:1075 [backend fallback]\n",
+      "VmapMode: fallthrough registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\VmapModeRegistrations.cpp:33 [backend fallback]\n",
+      "FuncTorchGradWrapper: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\functorch\\TensorWrapper.cpp:210 [backend fallback]\n",
+      "PythonTLSSnapshot: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\PythonFallbackKernel.cpp:202 [backend fallback]\n",
+      "FuncTorchDynamicLayerFrontMode: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\functorch\\DynamicLayer.cpp:475 [backend fallback]\n",
+      "PreDispatch: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\PythonFallbackKernel.cpp:206 [backend fallback]\n",
+      "PythonDispatcher: registered at C:\\actions-runner\\_work\\pytorch\\pytorch\\pytorch\\aten\\src\\ATen\\core\\PythonFallbackKernel.cpp:198 [backend fallback]\n",
+      "\n",
+      "\n",
+      "Return Code: 1\n"
+     ]
+    }
+   ],
+   "source": [
+    "import subprocess\n",
+    "\n",
+    "MODEL_FOLDER = r\"D:\\users\\henrisel\\stable-fast-3d\"\n",
+    "PROJECT_FOLDER = r\"D:\\users\\henrisel\\DeltaVR3DModelGeneration\\3d-generation-pipeline\"\n",
+    "\n",
+    "# Path to the Python interpreter in the other virtual environment\n",
+    "venv_python = MODEL_FOLDER + r\"\\.venv\\Scripts\\python.exe\"\n",
+    "\n",
+    "# Path to the .py file you want to run\n",
+    "script_path = MODEL_FOLDER + r\"\\run.py\"\n",
+    "\n",
+    "# Optional: arguments to pass to the script\n",
+    "args = [MODEL_FOLDER + r\"\\demo_files\\examples\\chair1.png\", \"--output-dir\", PROJECT_FOLDER + r\"\\images\"]\n",
+    "\n",
+    "# Build the command\n",
+    "command = [venv_python, script_path] + args\n",
+    "\n",
+    "try:\n",
+    "    # Run the subprocess\n",
+    "    result = subprocess.run(command, capture_output=True, text=True)\n",
+    "\n",
+    "    # Print output and errors\n",
+    "    print(\"STDOUT:\\n\", result.stdout)\n",
+    "    print(\"STDERR:\\n\", result.stderr)\n",
+    "    print(\"Return Code:\", result.returncode)\n",
+    "\n",
+    "except Exception as e:\n",
+    "    print(f\"Error occurred: {e}\")\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "ee480ba6",
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": ".venv",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.10.0"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
--- a/3d-generation-pipeline/requirements.txt
+++ b/3d-generation-pipeline/requirements.txt
@@ -0,0 +1,7 @@
+# torch==2.8.0+cu129 is not installed by this file; install it separately, see https://pytorch.org/get-started/previous-versions/
+transformers==4.57.0
+git+https://github.com/huggingface/diffusers.git
+accelerate==1.10.1
+huggingface_hub[hf_xet]==1.1.10
+sentencepiece==0.2.1
+protobuf==6.32.1
--- a/3d-generation-pipeline/start_pipeline.py
+++ b/3d-generation-pipeline/start_pipeline.py
@@ -0,0 +1,62 @@
+import argparse
+import asyncio
+import logging
+import time
+
+from pathlib import Path
+from datetime import datetime
+from dotenv import load_dotenv
+
+from generate_image_local import text_to_image_invoke_ai
+from generate_model_local import image_to_3d_api
+
+load_dotenv()
+
+
+def get_timestamp():
+    return datetime.now().strftime("%Y-%m-%d-%H-%M-%S")
+
+def setup_logger(base_folder, timestamp):
+    log_dir = base_folder / Path("logs")
+    log_dir.mkdir(parents=True, exist_ok=True)
+    logging.basicConfig(
+        filename=log_dir / f"{timestamp}.log",
+        level=logging.INFO,
+        force=True
+    )
+
+
+async def main():
+    parser = argparse.ArgumentParser(description="Text to 3D model pipeline")
+    parser.add_argument("--prompt", type=str, required=True, help="User text prompt")
+    args = parser.parse_args()
+
+    input_prompt = args.prompt
+    print(f"Input prompt: {input_prompt}")
+    image_generation_prompt = input_prompt + ", realistic style, single object, front and side fully visible, plain neutral background, clear details, soft studio lighting, true-to-scale"
+    
+    pipeline_folder = Path(__file__).resolve().parent
+    timestamp = get_timestamp()
+    setup_logger(pipeline_folder, timestamp)
+    time_checkpoint = time.time()
+
+    image_path = pipeline_folder / "images" / f"{timestamp}.jpg"
+    # TODO: use Invoke AI or Cloudflare, depending on env var
+    #text_to_image_cloudflare(image_generation_prompt, image_path)
+    await text_to_image_invoke_ai(image_generation_prompt, image_path)
+    
+    image_generation_time = time.time() - time_checkpoint
+    time_checkpoint = time.time()
+    logging.info(f"Image generation time: {round(image_generation_time, 1)} s")
+    print(f"Generated image file: {image_path}")
+
+    model_path = pipeline_folder / "models" / timestamp
+    model_file = image_to_3d_api(image_path, model_path)
+
+    model_generation_time = time.time() - time_checkpoint
+    logging.info(f"Model generation time: {round(model_generation_time, 1)} s")
+    print(f"Generated 3D model file: {model_file}")
+
+
+if __name__ == "__main__":
+    asyncio.run(main())
--- a/Assets/StreamingAssets/Whisper.meta
+++ b/Assets/StreamingAssets/Whisper.meta
@@ -0,0 +1,8 @@
+fileFormatVersion: 2
+guid: 23fe3883e9cc804429bc54fb860d18f1
+folderAsset: yes
+DefaultImporter:
+  externalObjects: {}
+  userData: 
+  assetBundleName: 
+  assetBundleVariant: 
--- a/Assets/StreamingAssets/Whisper/ggml-base.bin
+++ b/Assets/StreamingAssets/Whisper/ggml-base.bin
--- a/Assets/StreamingAssets/Whisper/ggml-base.bin.meta
+++ b/Assets/StreamingAssets/Whisper/ggml-base.bin.meta
@@ -0,0 +1,7 @@
+fileFormatVersion: 2
+guid: f6c028f06eda5904eae3f7a7418b8416
+DefaultImporter:
+  externalObjects: {}
+  userData: 
+  assetBundleName: 
+  assetBundleVariant: 
--- a/Assets/_PROJECT/Components/Bolt/Lexus2016RXTireNormal.png.png.meta
+++ b/Assets/_PROJECT/Components/Bolt/Lexus2016RXTireNormal.png.png.meta
@@ -7,7 +7,7 @@ TextureImporter:
  mipmaps:
    mipMapMode: 0
    enableMipMap: 1
-    sRGBTexture: 1
+    sRGBTexture: 0
    linearTexture: 0
    fadeOut: 0
    borderMipMap: 0
@@ -54,7 +54,7 @@ TextureImporter:
  alphaUsage: 1
  alphaIsTransparency: 0
  spriteTessellationDetail: -1
-  textureType: 0
+  textureType: 1
  textureShape: 1
  singleChannelComponent: 0
  flipbookRows: 1
--- a/Assets/_PROJECT/Components/Bow/Scripts/ArcheryRange.cs
+++ b/Assets/_PROJECT/Components/Bow/Scripts/ArcheryRange.cs
@@ -1,6 +1,7 @@
 using System;
 using System.Collections.Generic;
 using System.Linq;
+using System.Threading.Tasks;
 using _PROJECT.Scripts.Bow;
 using FishNet.Object;
 using FishNet.Object.Synchronizing;
@@ -36,6 +37,8 @@ public class ArcheryRange : NetworkBehaviour
    private float _nextTargetTime;
    private bool _roundActive;

+    private string targetModelName;
+
    private readonly List<XROrigin> _presentPlayers = new();

    private XROrigin _scoredPlayer;
@@ -112,27 +115,32 @@ public class ArcheryRange : NetworkBehaviour
        }
    }

-    private void SpawnTarget()
+    async private void SpawnTarget()
    {
        if (!IsServer) return;
        
        var randomPos = targetStartPosition.position + new Vector3(
            Random.Range(minRandomOffset.x, maxRandomOffset.x),
-            (float)Math.Round(Random.Range(minRandomOffset.y, maxRandomOffset.y)),
-            Random.Range(minRandomOffset.z, maxRandomOffset.z));
-
-        var target = SpawnTarget(randomPos);
+            (float) Math.Round(Random.Range(minRandomOffset.y, maxRandomOffset.y)),
+            Random.Range(minRandomOffset.z, maxRandomOffset.z)
+        );

+        var target = await SpawnTarget(randomPos);
        _targets.Add(target);
    }

-    private ArcheryTarget SpawnTarget(Vector3 randomPos)
+    async private Task<ArcheryTarget> SpawnTarget(Vector3 randomPos)
    {
-        var prefab = Instantiate(targetPrefab, randomPos, Quaternion.identity, null);
-        ArcheryTarget target = prefab.GetComponent<ArcheryTarget>();
+        var targetObject = Instantiate(targetPrefab, randomPos, Quaternion.identity, null);
+        GameObject targetReplacement = await PipelineManager.Instance.SpawnModel(targetModelName);
+        // TODO: replace target prefab's child with the generated model
+        targetReplacement.transform.parent = targetObject.transform;
+        targetReplacement.transform.position = targetObject.transform.position;
+
+        ArcheryTarget target = targetObject.GetComponent<ArcheryTarget>();
        target.endPosition = targetEndPosition.position;
        target.addScore = AddScore;
-        Spawn(prefab);
+        Spawn(targetObject);
        return target;
    }

@@ -148,7 +156,7 @@ public class ArcheryRange : NetworkBehaviour
        _targets = new List<ArcheryTarget>();
        if (_maxScore < _score) _maxScore = _score;

-        if(_presentPlayers.Count != 0) // If there are players in the area.
+        if (_presentPlayers.Count != 0) // If there are players in the area.
        {
            // Gives the score to the player longest-lasting in the area. It would be better to give it to the player that fired the starting arrow, but I'm not spending 10 hours on this. 

@@ -175,9 +183,12 @@ public class ArcheryRange : NetworkBehaviour
        SetTimeLeftText("");
    }

-    public void StartRound()
+    async public void StartRound()
    {
        if (!IsServer) return;
+
+        targetModelName = await PipelineManager.Instance.GenerateModelAsync("unicorn with golden horn and long fluffy tail and butterfly wings");
+
        _roundEndTime = Time.time + roundLength;
        _nextTargetTime = Time.time;
        _roundActive = true;
--- a/Assets/_PROJECT/Components/Bow/Scripts/ArcheryTarget.cs
+++ b/Assets/_PROJECT/Components/Bow/Scripts/ArcheryTarget.cs
@@ -1,10 +1,7 @@
 using System;
-using _PROJECT.Scripts.Bow;
-using _PROJECT.Scripts.Bow.Extra;
 using FishNet.Object;
 using FishNet.Object.Synchronizing;
 using UnityEngine;
-using Random = UnityEngine.Random;

 public class ArcheryTarget : NetworkBehaviour, IArrowHittable
 {
@@ -13,12 +10,10 @@ public class ArcheryTarget : NetworkBehaviour, IArrowHittable
    public Vector3 endPosition;
    public float forwardSpeed = 2f;
    public Action<float> addScore;
-    
-    private bool _flipDirection;

    private void Awake()
    {
-        _flipDirection = Random.value > 0.5f;
+        
    }

    // Update is called once per frame
@@ -28,11 +23,12 @@ public class ArcheryTarget : NetworkBehaviour, IArrowHittable
        float step = forwardSpeed * Time.deltaTime;
        var position = transform.position;

-        if (Math.Abs(position.x - endPosition.x) < 0.1) Destroy(gameObject);
+        if (Math.Abs(position.x - endPosition.x) < 0.1)
+        {
+            Destroy(gameObject);
+        }

-        
-        transform.position = Vector3.MoveTowards(position,
-            new Vector3(endPosition.x, position.y, position.z), step);
+        transform.position = Vector3.MoveTowards(position, new Vector3(endPosition.x, position.y, position.z), step);
    }

    public void Hit(Arrow arrow)
--- a/Assets/_PROJECT/Materials/Green.mat
+++ b/Assets/_PROJECT/Materials/Green.mat
@@ -0,0 +1,133 @@
+%YAML 1.1
+%TAG !u! tag:unity3d.com,2011:
+--- !u!21 &2100000
+Material:
+  serializedVersion: 8
+  m_ObjectHideFlags: 0
+  m_CorrespondingSourceObject: {fileID: 0}
+  m_PrefabInstance: {fileID: 0}
+  m_PrefabAsset: {fileID: 0}
+  m_Name: Green
+  m_Shader: {fileID: 4800000, guid: 933532a4fcc9baf4fa0491de14d08ed7, type: 3}
+  m_Parent: {fileID: 0}
+  m_ModifiedSerializedProperties: 0
+  m_ValidKeywords: []
+  m_InvalidKeywords: []
+  m_LightmapFlags: 4
+  m_EnableInstancingVariants: 0
+  m_DoubleSidedGI: 0
+  m_CustomRenderQueue: -1
+  stringTagMap:
+    RenderType: Opaque
+  disabledShaderPasses: []
+  m_LockedProperties: 
+  m_SavedProperties:
+    serializedVersion: 3
+    m_TexEnvs:
+    - _BaseMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _BumpMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _DetailAlbedoMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _DetailMask:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _DetailNormalMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _EmissionMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _MainTex:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _MetallicGlossMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _OcclusionMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _ParallaxMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _SpecGlossMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - unity_Lightmaps:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - unity_LightmapsInd:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - unity_ShadowMasks:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    m_Ints: []
+    m_Floats:
+    - _AlphaClip: 0
+    - _AlphaToMask: 0
+    - _Blend: 0
+    - _BlendModePreserveSpecular: 1
+    - _BumpScale: 1
+    - _ClearCoatMask: 0
+    - _ClearCoatSmoothness: 0
+    - _Cull: 2
+    - _Cutoff: 0.5
+    - _DetailAlbedoMapScale: 1
+    - _DetailNormalMapScale: 1
+    - _DstBlend: 0
+    - _DstBlendAlpha: 0
+    - _EnvironmentReflections: 1
+    - _GlossMapScale: 0
+    - _Glossiness: 0
+    - _GlossyReflections: 0
+    - _Metallic: 0
+    - _OcclusionStrength: 1
+    - _Parallax: 0.005
+    - _QueueOffset: 0
+    - _ReceiveShadows: 1
+    - _Smoothness: 0.5
+    - _SmoothnessTextureChannel: 0
+    - _SpecularHighlights: 1
+    - _SrcBlend: 1
+    - _SrcBlendAlpha: 1
+    - _Surface: 0
+    - _WorkflowMode: 1
+    - _ZWrite: 1
+    m_Colors:
+    - _BaseColor: {r: 0, g: 1, b: 0.0381248, a: 1}
+    - _Color: {r: 0, g: 1, b: 0.0381248, a: 1}
+    - _EmissionColor: {r: 0, g: 0, b: 0, a: 1}
+    - _SpecColor: {r: 0.19999996, g: 0.19999996, b: 0.19999996, a: 1}
+  m_BuildTextureStacks: []
+--- !u!114 &6221994712197478572
+MonoBehaviour:
+  m_ObjectHideFlags: 11
+  m_CorrespondingSourceObject: {fileID: 0}
+  m_PrefabInstance: {fileID: 0}
+  m_PrefabAsset: {fileID: 0}
+  m_GameObject: {fileID: 0}
+  m_Enabled: 1
+  m_EditorHideFlags: 0
+  m_Script: {fileID: 11500000, guid: d0353a89b1f911e48b9e16bdc9f2e058, type: 3}
+  m_Name: 
+  m_EditorClassIdentifier: 
+  version: 7
--- a/Assets/_PROJECT/Materials/Green.mat.meta
+++ b/Assets/_PROJECT/Materials/Green.mat.meta
@@ -0,0 +1,8 @@
+fileFormatVersion: 2
+guid: 937c5f357ed270843bd43d1f7d5d475b
+NativeFormatImporter:
+  externalObjects: {}
+  mainObjectFileID: 2100000
+  userData: 
+  assetBundleName: 
+  assetBundleVariant: 
--- a/Assets/_PROJECT/Materials/Red.mat
+++ b/Assets/_PROJECT/Materials/Red.mat
@@ -0,0 +1,133 @@
+%YAML 1.1
+%TAG !u! tag:unity3d.com,2011:
+--- !u!114 &-7093071968994914494
+MonoBehaviour:
+  m_ObjectHideFlags: 11
+  m_CorrespondingSourceObject: {fileID: 0}
+  m_PrefabInstance: {fileID: 0}
+  m_PrefabAsset: {fileID: 0}
+  m_GameObject: {fileID: 0}
+  m_Enabled: 1
+  m_EditorHideFlags: 0
+  m_Script: {fileID: 11500000, guid: d0353a89b1f911e48b9e16bdc9f2e058, type: 3}
+  m_Name: 
+  m_EditorClassIdentifier: 
+  version: 7
+--- !u!21 &2100000
+Material:
+  serializedVersion: 8
+  m_ObjectHideFlags: 0
+  m_CorrespondingSourceObject: {fileID: 0}
+  m_PrefabInstance: {fileID: 0}
+  m_PrefabAsset: {fileID: 0}
+  m_Name: Red
+  m_Shader: {fileID: 4800000, guid: 933532a4fcc9baf4fa0491de14d08ed7, type: 3}
+  m_Parent: {fileID: 0}
+  m_ModifiedSerializedProperties: 0
+  m_ValidKeywords: []
+  m_InvalidKeywords: []
+  m_LightmapFlags: 4
+  m_EnableInstancingVariants: 0
+  m_DoubleSidedGI: 0
+  m_CustomRenderQueue: -1
+  stringTagMap:
+    RenderType: Opaque
+  disabledShaderPasses: []
+  m_LockedProperties: 
+  m_SavedProperties:
+    serializedVersion: 3
+    m_TexEnvs:
+    - _BaseMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _BumpMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _DetailAlbedoMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _DetailMask:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _DetailNormalMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _EmissionMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _MainTex:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _MetallicGlossMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _OcclusionMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _ParallaxMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - _SpecGlossMap:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - unity_Lightmaps:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - unity_LightmapsInd:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    - unity_ShadowMasks:
+        m_Texture: {fileID: 0}
+        m_Scale: {x: 1, y: 1}
+        m_Offset: {x: 0, y: 0}
+    m_Ints: []
+    m_Floats:
+    - _AlphaClip: 0
+    - _AlphaToMask: 0
+    - _Blend: 0
+    - _BlendModePreserveSpecular: 1
+    - _BumpScale: 1
+    - _ClearCoatMask: 0
+    - _ClearCoatSmoothness: 0
+    - _Cull: 2
+    - _Cutoff: 0.5
+    - _DetailAlbedoMapScale: 1
+    - _DetailNormalMapScale: 1
+    - _DstBlend: 0
+    - _DstBlendAlpha: 0
+    - _EnvironmentReflections: 1
+    - _GlossMapScale: 0
+    - _Glossiness: 0
+    - _GlossyReflections: 0
+    - _Metallic: 0
+    - _OcclusionStrength: 1
+    - _Parallax: 0.005
+    - _QueueOffset: 0
+    - _ReceiveShadows: 1
+    - _Smoothness: 0.5
+    - _SmoothnessTextureChannel: 0
+    - _SpecularHighlights: 1
+    - _SrcBlend: 1
+    - _SrcBlendAlpha: 1
+    - _Surface: 0
+    - _WorkflowMode: 1
+    - _ZWrite: 1
+    m_Colors:
+    - _BaseColor: {r: 1, g: 0, b: 0, a: 1}
+    - _Color: {r: 1, g: 0, b: 0, a: 1}
+    - _EmissionColor: {r: 0, g: 0, b: 0, a: 1}
+    - _SpecColor: {r: 0.19999996, g: 0.19999996, b: 0.19999996, a: 1}
+  m_BuildTextureStacks: []
--- a/Assets/_PROJECT/Materials/Red.mat.meta
+++ b/Assets/_PROJECT/Materials/Red.mat.meta
@@ -0,0 +1,8 @@
+fileFormatVersion: 2
+guid: 707a698b0ec80454a8c68700bca72941
+NativeFormatImporter:
+  externalObjects: {}
+  mainObjectFileID: 2100000
+  userData: 
+  assetBundleName: 
+  assetBundleVariant: 
--- a/Assets/_PROJECT/Scenes/DeltaBuilding_base.unity
+++ b/Assets/_PROJECT/Scenes/DeltaBuilding_base.unity
--- a/Assets/_PROJECT/Scripts/3DModeGeneration.meta
+++ b/Assets/_PROJECT/Scripts/3DModeGeneration.meta
@@ -0,0 +1,8 @@
+fileFormatVersion: 2
+guid: 0ec3982ba49c4b84ea95332cb090e115
+folderAsset: yes
+DefaultImporter:
+  externalObjects: {}
+  userData: 
+  assetBundleName: 
+  assetBundleVariant: 
--- a/Assets/_PROJECT/Scripts/3DModeGeneration/ModelGenerationTestBox.cs
+++ b/Assets/_PROJECT/Scripts/3DModeGeneration/ModelGenerationTestBox.cs
@@ -0,0 +1,52 @@
+using UnityEngine;
+
+/// <summary>Test trigger volume: turns the latest voice transcription into a 3D model when a KbmController enters.</summary>
+public class ModelGenerationTestBox : MonoBehaviour
+{
+    public Material activeMaterial;
+    public Material inactiveMaterial;
+    public Transform modelSpawnPoint;
+    public VoiceTranscriptionTestBox voiceTranscriptionTestBox;
+
+    private MeshRenderer meshRenderer;
+    private bool isGenerating; // true while a pipeline run started by this box is in flight
+
+    void Start()
+    {
+        meshRenderer = GetComponent<MeshRenderer>();
+    }
+
+    // Unity calls this fire-and-forget (async void), so failures are caught and logged here.
+    async void OnTriggerEnter(Collider other)
+    {
+        if (other.GetComponent<KbmController>() == null) return;
+        meshRenderer.material = activeMaterial;
+        string inputPrompt = voiceTranscriptionTestBox.currentTextOutput;
+        // Skip when nothing has been transcribed yet or a previous run has not finished.
+        if (isGenerating || string.IsNullOrWhiteSpace(inputPrompt)) return;
+        isGenerating = true;
+        try
+        {
+            string modelPath = await PipelineManager.Instance.GenerateModelAsync(inputPrompt);
+            GameObject spawnedObject = await PipelineManager.Instance.SpawnModel(modelPath);
+            // The box may have been destroyed while the pipeline was running.
+            if (this == null) { Destroy(spawnedObject); return; }
+            spawnedObject.transform.parent = modelSpawnPoint;
+            spawnedObject.transform.position = modelSpawnPoint.position;
+        }
+        catch (System.Exception e)
+        {
+            Debug.LogException(e, this);
+        }
+        finally
+        {
+            isGenerating = false;
+        }
+    }
+
+    private void OnTriggerExit(Collider other)
+    {
+        if (other.GetComponent<KbmController>() == null) return;
+        meshRenderer.material = inactiveMaterial;
+    }
+}
--- a/Assets/_PROJECT/Scripts/3DModeGeneration/ModelGenerationTestBox.cs.meta
+++ b/Assets/_PROJECT/Scripts/3DModeGeneration/ModelGenerationTestBox.cs.meta
@@ -0,0 +1,11 @@
+fileFormatVersion: 2
+guid: 46e67223dce9b7a4783ed36b8ed65f19
+MonoImporter:
+  externalObjects: {}
+  serializedVersion: 2
+  defaultReferences: []
+  executionOrder: 0
+  icon: {instanceID: 0}
+  userData: 
+  assetBundleName: 
+  assetBundleVariant: 
--- a/Assets/_PROJECT/Scripts/3DModeGeneration/PipelineManager.cs
+++ b/Assets/_PROJECT/Scripts/3DModeGeneration/PipelineManager.cs
@@ -0,0 +1,104 @@
+using GLTFast;
+using System.Diagnostics;
+using System.Threading.Tasks;
+using UnityEngine;
+
+/// <summary>Scene singleton that runs the external Python text-to-3D pipeline and spawns the resulting glTF model.</summary>
+public class PipelineManager : MonoBehaviour
+{
+    private const string ModelPathPrefix = "Generated 3D model file: ";
+
+    public static PipelineManager Instance { get; private set; }
+
+    // Defaults are the original development-machine paths; override them in the Inspector on other machines.
+    [SerializeField] private string pythonExe = @"D:\users\henrisel\DeltaVR3DModelGeneration\3d-generation-pipeline\.venv\Scripts\python.exe";
+    [SerializeField] private string scriptPath = @"D:\users\henrisel\DeltaVR3DModelGeneration\3d-generation-pipeline\start_pipeline.py";
+
+    private void Awake()
+    {
+        Instance = this;
+    }
+
+    /// <summary>
+    /// Runs the pipeline script with <paramref name="inputPrompt"/> on a worker thread and waits for it to exit.
+    /// </summary>
+    /// <returns>The text the script printed after "Generated 3D model file: ".</returns>
+    /// <exception cref="System.Exception">The script output contained no model path line.</exception>
+    public async Task<string> GenerateModelAsync(string inputPrompt)
+    {
+        // Read the serialized fields on the calling thread; the lambda below runs on the thread pool.
+        string exe = pythonExe;
+        string arguments = $"{QuoteArgument(scriptPath)} --prompt {QuoteArgument(inputPrompt)}";
+
+        return await Task.Run(() =>
+        {
+            ProcessStartInfo psi = new ProcessStartInfo
+            {
+                FileName = exe,
+                Arguments = arguments,
+                UseShellExecute = false,
+                RedirectStandardOutput = true,
+                RedirectStandardError = true,
+                CreateNoWindow = true
+            };
+
+            using (Process process = new Process())
+            {
+                var errorText = new System.Text.StringBuilder();
+                process.StartInfo = psi;
+                process.ErrorDataReceived += (sender, e) => { if (e.Data != null) errorText.AppendLine(e.Data); };
+
+                process.Start();
+                // Drain stderr asynchronously: reading both pipes with ReadToEnd can deadlock when the
+                // child blocks on a full stderr pipe while this thread is still waiting on stdout.
+                process.BeginErrorReadLine();
+                string output = process.StandardOutput.ReadToEnd();
+                process.WaitForExit();
+
+                foreach (string line in output.Split('\n'))
+                {
+                    if (line.StartsWith(ModelPathPrefix))
+                    {
+                        return line.Substring(ModelPathPrefix.Length).Trim();
+                    }
+                }
+                throw new System.Exception($"Failed to generate 3D model! Exit code {process.ExitCode}.\n{errorText}");
+            }
+        });
+    }
+
+    // Wraps one argument in quotes per the Windows command-line rules: backslashes are literal unless they
+    // precede a quote, so only those runs (and a trailing run before the closing quote) are doubled.
+    private static string QuoteArgument(string value)
+    {
+        string escaped = System.Text.RegularExpressions.Regex.Replace(value ?? "", @"(\\*)""", @"$1$1\""");
+        escaped = System.Text.RegularExpressions.Regex.Replace(escaped, @"(\\+)\z", "$1$1");
+        return "\"" + escaped + "\"";
+    }
+
+    /// <summary>
+    /// Loads the glTF file at <paramref name="modelPath"/> under a new "spawned model" GameObject and adds a
+    /// convex MeshCollider to its mesh object and a Rigidbody to that object's parent.
+    /// </summary>
+    /// <exception cref="System.Exception">Loading or instantiating the model failed.</exception>
+    public async Task<GameObject> SpawnModel(string modelPath)
+    {
+        var gltf = new GltfImport();
+        if (await gltf.Load(modelPath))
+        {
+            GameObject spawnedObject = new GameObject("spawned model");
+            if (await gltf.InstantiateMainSceneAsync(spawnedObject.transform))
+            {
+                // NOTE(review): assumes the hierarchy is root -> node -> mesh object; confirm for other models.
+                Transform spawnedObjectMainTransform = spawnedObject.transform.GetChild(0);
+                GameObject spawnedObjectBody = spawnedObjectMainTransform.GetChild(0).gameObject;
+                spawnedObjectBody.AddComponent<MeshCollider>().convex = true;
+                spawnedObjectBody.GetComponent<MeshRenderer>().material.SetFloat("metallicFactor", 0);
+                spawnedObjectMainTransform.gameObject.AddComponent<Rigidbody>();
+                return spawnedObject;
+            }
+            Destroy(spawnedObject); // instantiation failed: do not leave the empty placeholder behind
+        }
+        throw new System.Exception("Failed to spawn GameObject from model " + modelPath);
+    }
+}
--- a/Assets/_PROJECT/Scripts/3DModeGeneration/PipelineManager.cs.meta
+++ b/Assets/_PROJECT/Scripts/3DModeGeneration/PipelineManager.cs.meta
@@ -0,0 +1,11 @@
+fileFormatVersion: 2
+guid: 19e82e42c38cf2d4b912baa8d60c5407
+MonoImporter:
+  externalObjects: {}
+  serializedVersion: 2
+  defaultReferences: []
+  executionOrder: 0
+  icon: {instanceID: 0}
+  userData: 
+  assetBundleName: 
+  assetBundleVariant: 
--- a/Assets/_PROJECT/Scripts/3DModeGeneration/VoiceTranscriptionTestBox.cs
+++ b/Assets/_PROJECT/Scripts/3DModeGeneration/VoiceTranscriptionTestBox.cs
@@ -0,0 +1,94 @@
+using System.Diagnostics;
+using TMPro;
+using UnityEngine;
+using Whisper;
+using Whisper.Utils;
+
+/// <summary>
+/// Test trigger volume: records the microphone while a KbmController is inside it and transcribes the
+/// recording with Whisper when recording stops.
+/// </summary>
+public class VoiceTranscriptionTestBox : MonoBehaviour
+{
+    public Material activeMaterial;
+    public Material inactiveMaterial;
+
+    private MeshRenderer meshRenderer;
+
+    public WhisperManager whisper;
+    public MicrophoneRecord microphoneRecord;
+    public TextMeshProUGUI outputText;
+
+    // Text of the segments received so far for the current transcription; only used for logging.
+    private string _buffer;
+    // Latest completed transcription; ModelGenerationTestBox reads it as the generation prompt.
+    public string currentTextOutput;
+
+    private void Awake()
+    {
+        whisper.OnNewSegment += OnNewSegment;
+        whisper.OnProgress += OnProgressHandler;
+        microphoneRecord.OnRecordStop += OnRecordStop;
+    }
+
+    // Detach the handlers so the Whisper and microphone components stop calling into a destroyed box.
+    private void OnDestroy()
+    {
+        if (whisper != null)
+        {
+            whisper.OnNewSegment -= OnNewSegment;
+            whisper.OnProgress -= OnProgressHandler;
+        }
+        if (microphoneRecord != null) microphoneRecord.OnRecordStop -= OnRecordStop;
+    }
+
+    void Start()
+    {
+        meshRenderer = GetComponent<MeshRenderer>();
+    }
+
+    // Entering the box starts recording; leaving it stops the recording.
+    void OnTriggerEnter(Collider other)
+    {
+        if (other.GetComponent<KbmController>() == null) return;
+        meshRenderer.material = activeMaterial;
+        microphoneRecord.StartRecord();
+    }
+
+    private void OnTriggerExit(Collider other)
+    {
+        if (other.GetComponent<KbmController>() == null) return;
+        meshRenderer.material = inactiveMaterial;
+        microphoneRecord.StopRecord();
+    }
+
+    // Transcribes the finished recording and publishes the text to currentTextOutput and the UI label.
+    private async void OnRecordStop(AudioChunk recordedAudio)
+    {
+        _buffer = "";
+
+        var sw = Stopwatch.StartNew();
+        var res = await whisper.GetTextAsync(recordedAudio.Data, recordedAudio.Frequency, recordedAudio.Channels);
+        // Nothing to publish if transcription returned no result or the box was destroyed meanwhile.
+        if (res == null || this == null)
+            return;
+
+        var time = sw.ElapsedMilliseconds;
+        var rate = recordedAudio.Length / (time * 0.001f);
+        UnityEngine.Debug.Log($"Time: {time} ms\nRate: {rate:F1}x");
+
+        currentTextOutput = res.Result;
+        outputText.text = res.Result;
+    }
+
+    private void OnProgressHandler(int progress)
+    {
+        UnityEngine.Debug.Log($"Progress: {progress}%");
+    }
+
+    private void OnNewSegment(WhisperSegment segment)
+    {
+        _buffer += segment.Text;
+        UnityEngine.Debug.Log(_buffer + "...");
+    }
+}
--- a/Assets/_PROJECT/Scripts/3DModeGeneration/VoiceTranscriptionTestBox.cs.meta
+++ b/Assets/_PROJECT/Scripts/3DModeGeneration/VoiceTranscriptionTestBox.cs.meta
@@ -0,0 +1,11 @@
+fileFormatVersion: 2
+guid: d28857190597d9a46a8ddf3cf902cc81
+MonoImporter:
+  externalObjects: {}
+  serializedVersion: 2
+  defaultReferences: []
+  executionOrder: 0
+  icon: {instanceID: 0}
+  userData: 
+  assetBundleName: 
+  assetBundleVariant: 
--- a/Assets/_PROJECT/Scripts/Audio/VoiceTranscription.cs
+++ b/Assets/_PROJECT/Scripts/Audio/VoiceTranscription.cs
@@ -0,0 +1,57 @@
+using System.Diagnostics;
+using UnityEngine;
+using Whisper;
+using Whisper.Utils;
+
+/// <summary>
+/// Transcribes every finished microphone recording with Whisper and writes the text to the Unity log.
+/// </summary>
+public class VoiceTranscription : MonoBehaviour
+{
+    public WhisperManager whisper;
+    public MicrophoneRecord microphoneRecord;
+
+    // Text of the segments received so far for the current transcription; only used for logging.
+    private string _buffer;
+
+    private void Awake()
+    {
+        whisper.OnNewSegment += OnNewSegment;
+        microphoneRecord.OnRecordStop += OnRecordStop;
+    }
+
+    // Detach the handlers so the Whisper and microphone components stop calling into a destroyed object.
+    private void OnDestroy()
+    {
+        if (whisper != null)
+        {
+            whisper.OnNewSegment -= OnNewSegment;
+        }
+        if (microphoneRecord != null)
+        {
+            microphoneRecord.OnRecordStop -= OnRecordStop;
+        }
+    }
+
+    // Transcribes the finished recording, then logs how long it took and the resulting text.
+    private async void OnRecordStop(AudioChunk recordedAudio)
+    {
+        _buffer = "";
+
+        var sw = Stopwatch.StartNew();
+        var res = await whisper.GetTextAsync(recordedAudio.Data, recordedAudio.Frequency, recordedAudio.Channels);
+        if (res == null)
+            return;
+
+        var time = sw.ElapsedMilliseconds;
+        var rate = recordedAudio.Length / (time * 0.001f);
+        UnityEngine.Debug.Log($"Time: {time} ms\nRate: {rate:F1}x");
+        UnityEngine.Debug.Log(res.Result);
+    }
+
+    private void OnNewSegment(WhisperSegment segment)
+    {
+        _buffer += segment.Text;
+        UnityEngine.Debug.Log(_buffer + "...");
+    }
+}
--- a/Assets/_PROJECT/Scripts/Audio/VoiceTranscription.cs.meta
+++ b/Assets/_PROJECT/Scripts/Audio/VoiceTranscription.cs.meta
@@ -0,0 +1,11 @@
+fileFormatVersion: 2
+guid: af83274dbfe8bab4599dda694e2545c2
+MonoImporter:
+  externalObjects: {}
+  serializedVersion: 2
+  defaultReferences: []
+  executionOrder: 0
+  icon: {instanceID: 0}
+  userData: 
+  assetBundleName: 
+  assetBundleVariant: 
--- a/Doc/clips/Bolt-Car-Network-Problem-Clip.gif
+++ b/Doc/clips/Bolt-Car-Network-Problem-Clip.gif
--- a/Doc/clips/Bolt-Car-Network-Results-Clip.gif
+++ b/Doc/clips/Bolt-Car-Network-Results-Clip.gif
--- a/Doc/clips/Camera-Collider-Clip.gif
+++ b/Doc/clips/Camera-Collider-Clip.gif
--- a/Doc/clips/Door-Collision-Solution-Clip.gif
+++ b/Doc/clips/Door-Collision-Solution-Clip.gif
--- a/Doc/clips/Door-Grabbing-Clip.gif
+++ b/Doc/clips/Door-Grabbing-Clip.gif
--- a/Doc/clips/Doors-Issue-Clip.gif
+++ b/Doc/clips/Doors-Issue-Clip.gif
--- a/Doc/clips/Elevator-Move-Between-Floors-Clip.gif
+++ b/Doc/clips/Elevator-Move-Between-Floors-Clip.gif
--- a/Doc/clips/Elevator-Open-Close-Doors-Clip.gif
+++ b/Doc/clips/Elevator-Open-Close-Doors-Clip.gif
--- a/Doc/clips/Elevator-network-problem-Clip.gif
+++ b/Doc/clips/Elevator-network-problem-Clip.gif
--- a/Doc/clips/Elevator-network-results-Clip.gif
+++ b/Doc/clips/Elevator-network-results-Clip.gif
--- a/Doc/clips/Ghost-Hand-Clip.gif
+++ b/Doc/clips/Ghost-Hand-Clip.gif
--- a/Doc/clips/Hand-Collider-Prototype-Clip.gif
+++ b/Doc/clips/Hand-Collider-Prototype-Clip.gif
--- a/Doc/clips/Open-Elevator-Doors-Same-Floor-Clip.gif
+++ b/Doc/clips/Open-Elevator-Doors-Same-Floor-Clip.gif
--- a/Doc/clips/Player-Hand-Collision-Complete-Clip.gif
+++ b/Doc/clips/Player-Hand-Collision-Complete-Clip.gif
--- a/Doc/clips/Summon-Elevator-Clip.gif
+++ b/Doc/clips/Summon-Elevator-Clip.gif
--- a/Doc/clips/VR-Elevator-Example-Clip.gif
+++ b/Doc/clips/VR-Elevator-Example-Clip.gif
--- a/Doc/designs/Doorknob-Rework-Blender.png
+++ b/Doc/designs/Doorknob-Rework-Blender.png
--- a/Doc/designs/Doorknob-Rework-Unity.png
+++ b/Doc/designs/Doorknob-Rework-Unity.png
--- a/Doc/designs/Elevator-buttons-inside.png
+++ b/Doc/designs/Elevator-buttons-inside.png
--- a/Doc/designs/Model-Collider-Rework-Concept.png
+++ b/Doc/designs/Model-Collider-Rework-Concept.png
--- a/Doc/designs/Moder-Collider-Rework-Results.png
+++ b/Doc/designs/Moder-Collider-Rework-Results.png
--- a/Doc/designs/Network-Player-mirror.png
+++ b/Doc/designs/Network-Player-mirror.png
--- a/Doc/designs/Old-VR-Doorknob.png
+++ b/Doc/designs/Old-VR-Doorknob.png
--- a/Doc/designs/Original-elevator-state-diagram.png
+++ b/Doc/designs/Original-elevator-state-diagram.png
--- a/Doc/designs/Player-Hand-Colliders.png
+++ b/Doc/designs/Player-Hand-Colliders.png
--- a/Doc/designs/Real-Doorknob.jpg
+++ b/Doc/designs/Real-Doorknob.jpg
--- a/Doc/designs/Two-Elevators.png
+++ b/Doc/designs/Two-Elevators.png
--- a/Packages/manifest.json
+++ b/Packages/manifest.json
@@ -4,6 +4,7 @@
    "com.unity.2d.tilemap": "1.0.0",
    "com.unity.ai.navigation": "1.1.1",
    "com.unity.cinemachine": "2.9.5",
+    "com.unity.cloud.gltfast": "6.14.1",
    "com.unity.collab-proxy": "2.0.1",
    "com.unity.ext.nunit": "1.0.6",
    "com.unity.feature.vr": "1.0.0",
@@ -27,6 +28,7 @@
    "com.unity.xr.mock-hmd": "1.3.1-preview.1",
    "com.unity.xr.oculus": "3.2.3",
    "com.unity.xr.openxr": "1.7.0",
+    "com.whisper.unity": "https://github.com/Macoron/whisper.unity.git?path=/Packages/com.whisper.unity",
    "com.unity.modules.ai": "1.0.0",
    "com.unity.modules.androidjni": "1.0.0",
    "com.unity.modules.animation": "1.0.0",
--- a/Packages/packages-lock.json
+++ b/Packages/packages-lock.json
@@ -31,11 +31,12 @@
      "url": "https://packages.unity.com"
    },
    "com.unity.burst": {
-      "version": "1.8.3",
+      "version": "1.8.24",
      "depth": 1,
      "source": "registry",
      "dependencies": {
-        "com.unity.mathematics": "1.2.1"
+        "com.unity.mathematics": "1.2.1",
+        "com.unity.modules.jsonserialize": "1.0.0"
      },
      "url": "https://packages.unity.com"
    },
@@ -48,6 +49,19 @@
      },
      "url": "https://packages.unity.com"
    },
+    "com.unity.cloud.gltfast": {
+      "version": "6.14.1",
+      "depth": 0,
+      "source": "registry",
+      "dependencies": {
+        "com.unity.burst": "1.8.24",
+        "com.unity.collections": "1.2.4",
+        "com.unity.mathematics": "1.2.6",
+        "com.unity.modules.jsonserialize": "1.0.0",
+        "com.unity.modules.unitywebrequest": "1.0.0"
+      },
+      "url": "https://packages.unity.com"
+    },
    "com.unity.collab-proxy": {
      "version": "2.0.1",
      "depth": 0,
@@ -55,6 +69,16 @@
      "dependencies": {},
      "url": "https://packages.unity.com"
    },
+    "com.unity.collections": {
+      "version": "1.2.4",
+      "depth": 1,
+      "source": "registry",
+      "dependencies": {
+        "com.unity.burst": "1.6.6",
+        "com.unity.test-framework": "1.1.31"
+      },
+      "url": "https://packages.unity.com"
+    },
    "com.unity.editorcoroutines": {
      "version": "1.0.0",
      "depth": 1,
@@ -364,6 +388,13 @@
      },
      "url": "https://packages.unity.com"
    },
+    "com.whisper.unity": {
+      "version": "https://github.com/Macoron/whisper.unity.git?path=/Packages/com.whisper.unity",
+      "depth": 0,
+      "source": "git",
+      "dependencies": {},
+      "hash": "529a628a915a97799e89e061af9cb7c71407124d"
+    },
    "com.unity.modules.ai": {
      "version": "1.0.0",
      "depth": 0,
--- a/README.md
+++ b/README.md
@@ -66,17 +66,23 @@ Multiplayer and cross-play functionality. [Bachelor's Thesis](https://comserv.cs
 **Raimond Tunnel**<br/>
 Project management, visual design.

-**Timur Nizamov**<br/>
-Technical sound design.
-
 Developed in the [Computer Graphics and Virtual Reality Study Lab](https://cgvr.cs.ut.ee/) of the [Institute of Computer Science, University of Tartu](https://cs.ut.ee).

 ### Used Attributions

 | Description                                         | License                                      | Source                                                                                      | Author           |
 |-----------------------------------------------------|----------------------------------------------|---------------------------------------------------------------------------------------------|------------------|
+| Bold's car driving sound                            | Attribution NonCommercial 3.0                | [Link](https://freesound.org/people/Pfujimoto/sounds/14371/)                               | Pfujimoto        |
+| Bold's car braking sound                            | Attribution 3.0                              | [Link](https://freesound.org/people/200154michaela/sounds/542448/)                         | 200154michaela   |
+| Bold's car horn sound                               | Attribution 4.0                              | [Link](https://freesound.org/people/ceberation/sounds/235506/)                             | ceberation       |
 | Server rack model                                   | Royalty Free, No AI License                  | [Link](https://www.cgtrader.com/free-3d-models/electronics/computer/simple-server-model)   | anymelok         |
+| Server rack humming sound                           | Attribution 4.0                              | [Link](https://freesound.org/people/jameswrowles/sounds/248217/)                           | jameswrowles     |
+| Fire suppression button press sound                 | Creative Commons 0                           | [Link](https://freesound.org/people/LamaMakesMusic/sounds/403556/)                         | LamaMakesMusic   |
+| Fire suppression alarm sound                        | Attribution 3.0                              | [Link](https://freesound.org/people/jobro/sounds/33737/)                                   | jobro            |
+| Fire-suppressing gas release sound                  | Creative Commons 0                           | [Link](https://freesound.org/people/mrmccormack/sounds/182359/)                            | mrmccormack      |
+| Coughing sound in response to fire-suppressing gas  | Attribution 4.0                              | [Link](https://freesound.org/people/qubodup/sounds/739416/)                                | qubodup          |
 | Robot movement sound                                | Creative Commons 0                           | [Link](https://freesound.org/people/Brazilio123/sounds/661435/)                            | Brazilio123      |
+| Portal humming sound                                | Attribution 4.0                              | [Link](https://freesound.org/people/zimbot/sounds/122972/)                                 | zimbot           |
 | Spacewalk UFO sound                                 | Attribution NonCommercial 4.0                           | [Link](https://freesound.org/people/Speedenza/sounds/209366/)                           | Speedenza     |
 | Keyboard icons                                      | Creative Commons Attribution-NoDerivs 3.0    | [Link](https://icons8.com/)                                                                 | icons8           |
Author	SHA1	Message	Date
henrisel	7be20d249e	model generation test box takes input prompt from voice transcription box	2025-12-15 15:57:32 +02:00
henrisel	9c7536d1d4	transcribe voice to text with Whisper base model	2025-12-15 15:30:15 +02:00
henrisel	0c026078d0	install whisper.unity package	2025-12-15 13:57:07 +02:00
henrisel	843bd141eb	test different art styles, change pipeline prompt	2025-12-05 16:58:07 +02:00
henrisel	408949e5c2	WIP: spawn generated model as archery range target	2025-12-01 17:19:31 +02:00
henrisel	40e273f51e	refactored model generation code out of test box into separate pipeline manager	2025-12-01 17:06:42 +02:00
henrisel	a66cb8f62c	fix prompt	2025-11-28 15:29:00 +02:00
henrisel	cc3c481295	try out different text-to-img and img-to-3d params	2025-11-28 15:27:37 +02:00
henrisel	2980631414	decrease texture baking optimisation total steps	2025-11-21 16:30:56 +02:00
henrisel	c15ae24c7a	tune 3d generation params	2025-11-21 14:39:16 +02:00
henrisel	7f02dccc6b	use SD-XL model for img gen in pipeline	2025-11-21 12:57:53 +02:00
henrisel	34a6c50598	clean up code + prompt engineering for image generation	2025-11-21 11:39:36 +02:00
henrisel	191c9e66fe	fix metallic property when spawning object	2025-11-21 10:32:15 +02:00
henrisel	d7fec73c77	added logging to file	2025-11-14 09:53:30 +02:00
henrisel	590c62eadd	incorporate InvokeAI into start_pipeline.py	2025-11-12 17:51:02 +02:00
henrisel	fdd4ff827e	reimplement function from invokeai_mcp_server to make requests to local InvokeAI	2025-11-10 18:19:16 +02:00
henrisel	d2e1c7b56f	fix networking UI again + tweaks to pipeline script	2025-11-07 16:56:34 +02:00
henrisel	09f764c0df	integrate local trellis api into start_pipeline.py	2025-11-07 16:22:13 +02:00
henrisel	447449e1b3	local TRELLIS API test notebook	2025-11-07 14:54:41 +02:00
henrisel	d43408cf01	move pipeline starter in map	2025-11-05 18:02:06 +02:00
henrisel	9bfc55f2d6	add glTFast package + load in model after pipeline generation	2025-11-05 17:54:48 +02:00
Henri Sellis	1b0d9fd0b0	pipeline script passes generated model filepath to Unity	2025-11-02 17:20:41 +02:00
Henri Sellis	f8ca8570af	fix network manager (again)	2025-11-02 16:06:36 +02:00
henrisel	e25f1c75b5	update env example	2025-10-24 13:34:24 +03:00
henrisel	c5c40f58ab	Cube that starts generation pipeline on collision	2025-10-24 12:00:27 +03:00
Henri Sellis	2971027af2	fix start game UI	2025-10-24 10:22:53 +03:00
Henri Sellis	34a23ab94d	make 3d model generation model folder loc configurable	2025-10-24 10:03:16 +03:00
Henri Sellis	8b3965d0b1	generated images and models into gitignore	2025-10-24 09:49:24 +03:00
henrisel	42d7c0059b	Add TODO Azure OpenAI API	2025-10-21 14:32:19 +00:00
Henri Sellis	6413d5a3d6	start pipeline script dynamically calculates absolute paths	2025-10-20 16:37:02 +03:00
Henri Sellis	e4f9423ca6	passing user prompt to pipeline script as cmd argument	2025-10-19 12:17:34 +03:00
Henri Sellis	1bb878848f	combined pipeline running function	2025-10-18 16:44:38 +03:00
Henri Sellis	ae497eac6e	test local text-to-image models and cloudflare API	2025-10-18 16:06:54 +03:00
Henri Sellis	2cf0a9f711	start of 3d generation pipelines	2025-10-11 18:37:46 +03:00