{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 19,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some kwargs in processor config are unused and will not have any effect: time_horizon, action_dim, min_token, vocab_size, scale. \n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "os.sys.path.append(\"..\")\n",
    "\n",
    "import numpy as np\n",
    "from fast_tokenizer.processing_action_tokenizer import UniversalActionProcessor\n",
    "\n",
    "model_name_or_path = \"/inspire/ssd/ws-f4d69b29-e0a5-44e6-bd92-acf4de9990f0/public-project/public/yjc/cunxin/hf_cache/hub/models--physical-intelligence--fast/snapshots/ec4d7aa71691cac0b8bed6942be45684db2110f4\"\n",
    "\n",
    "tokenizer = UniversalActionProcessor.from_pretrained(model_name_or_path, trust_remote_code=True)\n",
    "action_data = np.random.rand(1, 1, 14)    # one batch of action chunks\n",
    "tokens = tokenizer(action_data)              # tokens = list[int]\n",
    "decoded_actions = tokenizer.decode(tokens)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "10\n",
      "action_data: [[0.80190911 0.04257572 0.62646499 0.01949756 0.64449236 0.90472229\n",
      "  0.03461226 0.5177021  0.29303347 0.36162611 0.0491308  0.7966445\n",
      "  0.77543698 0.64167579]]\n",
      "tokens: [302, 437, 437, 303, 402, 701, 545, 1431]\n",
      "decoded_actions: [[0.8 0.  0.6 0.  0.6 0.9 0.  0.5 0.3 0.4 0.  0.8 0.8 0.6]]\n"
     ]
    }
   ],
   "source": [
    "print(tokenizer.scale)\n",
    "print(\"action_data:\", action_data[0])\n",
    "print(\"tokens:\", tokens[0])\n",
    "print(\"decoded_actions:\", decoded_actions[0])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pickle\n",
    "with open(\"../vla-scripts/output_embeds.pkl\", \"rb\") as f:\n",
    "    output_embeds = pickle.load(f)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(tensor([-0.0036,  0.0033, -0.0068,  ...,  0.0056, -0.0082,  0.0069],\n",
       "        device='cuda:1', grad_fn=<SelectBackward0>),\n",
       " tensor([-0.0315,  0.0465, -0.0017,  ..., -0.0204,  0.0169,  0.0333],\n",
       "        device='cuda:1', grad_fn=<SelectBackward0>))"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "output_embeds[0], output_embeds[1]"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "vima",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.21"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
