Add package to hub

2026-04-14 10:22:37 +08:00 · 2022-05-08 06:47:12 +05:30
parent 6a7f65563c
commit c97b23b726
1 changed files with 401 additions and 22 deletions
--- a/unit1/unit1_bonus/Wandb
+++ b/unit1/unit1_bonus/Wandb
@@ -10,12 +10,12 @@
  },
  {
   "cell_type": "code",
-   "execution_count": 1,
+   "execution_count": 7,
   "id": "2e020e33",
   "metadata": {
    "ExecuteTime": {
-     "end_time": "2022-05-07T16:36:51.138888Z",
-     "start_time": "2022-05-07T16:36:49.643694Z"
+     "end_time": "2022-05-08T01:11:29.835785Z",
+     "start_time": "2022-05-08T01:11:29.831878Z"
    }
   },
   "outputs": [],
@@ -28,7 +28,7 @@
    "from stable_baselines3.common.evaluation import evaluate_policy\n",
    "from stable_baselines3.common.env_util import make_vec_env\n",
    "\n",
-    "from stable_baselines3.common.vec_env import VecVideoRecorder\n",
+    "from stable_baselines3.common.vec_env import VecVideoRecorder , DummyVecEnv\n",
    "\n",
    "# Import wandb stuff\n",
    "import wandb\n",
@@ -81,8 +81,8 @@
   "id": "ae0fd212",
   "metadata": {
    "ExecuteTime": {
-     "end_time": "2022-05-07T16:36:59.329343Z",
-     "start_time": "2022-05-07T16:36:53.808583Z"
+     "end_time": "2022-05-08T00:55:11.285850Z",
+     "start_time": "2022-05-08T00:55:05.640088Z"
    }
   },
   "outputs": [
@@ -108,7 +108,7 @@
    {
     "data": {
      "text/html": [
-       "Run data is saved locally in <code>/home/venom/Desktop/deep-rl-class/unit1/unit1_bonus/wandb/run-20220507_220654-8czogswz</code>"
+       "Run data is saved locally in <code>/home/venom/Desktop/deep-rl-class/unit1/unit1_bonus/wandb/run-20220508_062506-2ovixu73</code>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
@@ -120,7 +120,7 @@
    {
     "data": {
      "text/html": [
-       "Syncing run <strong><a href=\"https://wandb.ai/supersecurehuman/LunarLander-v2/runs/8czogswz\" target=\"_blank\">brisk-fire-2</a></strong> to <a href=\"https://wandb.ai/supersecurehuman/LunarLander-v2\" target=\"_blank\">Weights & Biases</a> (<a href=\"https://wandb.me/run\" target=\"_blank\">docs</a>)<br/>"
+       "Syncing run <strong><a href=\"https://wandb.ai/supersecurehuman/LunarLander-v2/runs/2ovixu73\" target=\"_blank\">warm-gorge-3</a></strong> to <a href=\"https://wandb.ai/supersecurehuman/LunarLander-v2\" target=\"_blank\">Weights & Biases</a> (<a href=\"https://wandb.me/run\" target=\"_blank\">docs</a>)<br/>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
@@ -138,6 +138,7 @@
    "    \"policy_type\": \"MlpPolicy\",\n",
    "    \"total_timesteps\": 100000,\n",
    "    \"env_name\": \"LunarLander-v2\",\n",
+    "    \"learning_rate\" : 0.0002,\n",
    "}\n",
    "\n",
    "run = wandb.init(\n",
@@ -166,8 +167,8 @@
   "id": "0b8046ae",
   "metadata": {
    "ExecuteTime": {
-     "end_time": "2022-05-07T16:37:34.011591Z",
-     "start_time": "2022-05-07T16:37:29.500555Z"
+     "end_time": "2022-05-08T00:55:59.965683Z",
+     "start_time": "2022-05-08T00:55:55.396867Z"
    }
   },
   "outputs": [
@@ -185,29 +186,126 @@
    "# be pretty resource intensive. \n",
    "# env = VecVideoRecorder(env, f\"videos/{run.id}\", record_video_trigger=lambda x: x % 2000 == 0, video_length=200) # Set the video recorder, to record our agent during training\n",
    "\n",
+    "# I would suggest you to add all your hyperparameters in the config dictionary defined before the wandb init step. This would help you to visualize the effect those hyper parameters\n",
+    "# have on your model, via the wandb dashboard\n",
    "model = PPO(\n",
    "    policy = config[\"policy_type\"],\n",
    "    env = env,\n",
+    "    learning_rate=config[\"learning_rate\"],\n",
    "    tensorboard_log=\"logs\",\n",
    "    verbose=1)"
   ]
  },
  {
   "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 4,
   "id": "f772cc3f",
   "metadata": {
    "ExecuteTime": {
-     "end_time": "2022-05-07T16:39:54.654747Z",
-     "start_time": "2022-05-07T16:37:35.052748Z"
+     "end_time": "2022-05-08T00:59:14.354142Z",
+     "start_time": "2022-05-08T00:56:32.259913Z"
    },
    "scrolled": true
   },
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Logging to logs/PPO_1\n",
+      "---------------------------------\n",
+      "| rollout/           |          |\n",
+      "|    ep_len_mean     | 91.1     |\n",
+      "|    ep_rew_mean     | -170     |\n",
+      "| time/              |          |\n",
+      "|    fps             | 5432     |\n",
+      "|    iterations      | 1        |\n",
+      "|    time_elapsed    | 6        |\n",
+      "|    total_timesteps | 32768    |\n",
+      "---------------------------------\n",
+      "-----------------------------------------\n",
+      "| rollout/                |             |\n",
+      "|    ep_len_mean          | 98.9        |\n",
+      "|    ep_rew_mean          | -132        |\n",
+      "| time/                   |             |\n",
+      "|    fps                  | 1480        |\n",
+      "|    iterations           | 2           |\n",
+      "|    time_elapsed         | 44          |\n",
+      "|    total_timesteps      | 65536       |\n",
+      "| train/                  |             |\n",
+      "|    approx_kl            | 0.009069282 |\n",
+      "|    clip_fraction        | 0.0836      |\n",
+      "|    clip_range           | 0.2         |\n",
+      "|    entropy_loss         | -1.38       |\n",
+      "|    explained_variance   | 0.00211     |\n",
+      "|    learning_rate        | 0.0002      |\n",
+      "|    loss                 | 345         |\n",
+      "|    n_updates            | 10          |\n",
+      "|    policy_gradient_loss | -0.00783    |\n",
+      "|    value_loss           | 810         |\n",
+      "-----------------------------------------\n",
+      "-----------------------------------------\n",
+      "| rollout/                |             |\n",
+      "|    ep_len_mean          | 103         |\n",
+      "|    ep_rew_mean          | -104        |\n",
+      "| time/                   |             |\n",
+      "|    fps                  | 1135        |\n",
+      "|    iterations           | 3           |\n",
+      "|    time_elapsed         | 86          |\n",
+      "|    total_timesteps      | 98304       |\n",
+      "| train/                  |             |\n",
+      "|    approx_kl            | 0.012206479 |\n",
+      "|    clip_fraction        | 0.12        |\n",
+      "|    clip_range           | 0.2         |\n",
+      "|    entropy_loss         | -1.35       |\n",
+      "|    explained_variance   | 0.436       |\n",
+      "|    learning_rate        | 0.0002      |\n",
+      "|    loss                 | 77.5        |\n",
+      "|    n_updates            | 20          |\n",
+      "|    policy_gradient_loss | -0.0125     |\n",
+      "|    value_loss           | 335         |\n",
+      "-----------------------------------------\n",
+      "-----------------------------------------\n",
+      "| rollout/                |             |\n",
+      "|    ep_len_mean          | 113         |\n",
+      "|    ep_rew_mean          | -87.2       |\n",
+      "| time/                   |             |\n",
+      "|    fps                  | 1031        |\n",
+      "|    iterations           | 4           |\n",
+      "|    time_elapsed         | 127         |\n",
+      "|    total_timesteps      | 131072      |\n",
+      "| train/                  |             |\n",
+      "|    approx_kl            | 0.012416394 |\n",
+      "|    clip_fraction        | 0.167       |\n",
+      "|    clip_range           | 0.2         |\n",
+      "|    entropy_loss         | -1.31       |\n",
+      "|    explained_variance   | 0.513       |\n",
+      "|    learning_rate        | 0.0002      |\n",
+      "|    loss                 | 66.1        |\n",
+      "|    n_updates            | 30          |\n",
+      "|    policy_gradient_loss | -0.015      |\n",
+      "|    value_loss           | 257         |\n",
+      "-----------------------------------------\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "<stable_baselines3.ppo.ppo.PPO at 0x7fb0d70ccd50>"
+      ]
+     },
+     "execution_count": 4,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
   "source": [
    "# Now we do the magical stuff of logging to wandb. All you have to do is add the wandb callback to the model's callback like this\n",
    "\n",
-    "model.learn(total_timesteps=config[\"total_timesteps\"], callback=[WandbCallback()])"
+    "model.learn(total_timesteps=config[\"total_timesteps\"], \n",
+    "            callback=[WandbCallback(\n",
+    "                gradient_save_freq=100\n",
+    "            )])"
   ]
  },
  {
@@ -216,8 +314,8 @@
   "id": "d2a6341c",
   "metadata": {
    "ExecuteTime": {
-     "end_time": "2022-05-07T16:40:06.824067Z",
-     "start_time": "2022-05-07T16:39:54.696684Z"
+     "end_time": "2022-05-08T00:59:27.663456Z",
+     "start_time": "2022-05-08T00:59:14.382414Z"
    }
   },
   "outputs": [
@@ -255,7 +353,7 @@
       "    .wandb-row { display: flex; flex-direction: row; flex-wrap: wrap; justify-content: flex-start; width: 100% }\n",
       "    .wandb-col { display: flex; flex-direction: column; flex-basis: 100%; flex: 1; padding: 10px; }\n",
       "    </style>\n",
-       "<div class=\"wandb-row\"><div class=\"wandb-col\"><h3>Run history:</h3><br/><table class=\"wandb\"><tr><td>global_step</td><td>▁▃▆█</td></tr><tr><td>rollout/ep_len_mean</td><td>▁▃▄█</td></tr><tr><td>rollout/ep_rew_mean</td><td>▁▄▆█</td></tr><tr><td>time/fps</td><td>█▁▁▁</td></tr><tr><td>train/approx_kl</td><td>▁▇█</td></tr><tr><td>train/clip_fraction</td><td>▁▅█</td></tr><tr><td>train/clip_range</td><td>▁▁▁</td></tr><tr><td>train/entropy_loss</td><td>▁▄█</td></tr><tr><td>train/explained_variance</td><td>▁▇█</td></tr><tr><td>train/learning_rate</td><td>▁▁▁</td></tr><tr><td>train/loss</td><td>█▅▁</td></tr><tr><td>train/policy_gradient_loss</td><td>█▄▁</td></tr><tr><td>train/value_loss</td><td>█▂▁</td></tr></table><br/></div><div class=\"wandb-col\"><h3>Run summary:</h3><br/><table class=\"wandb\"><tr><td>global_step</td><td>131072</td></tr><tr><td>rollout/ep_len_mean</td><td>107.59</td></tr><tr><td>rollout/ep_rew_mean</td><td>-75.28564</td></tr><tr><td>time/fps</td><td>1176.0</td></tr><tr><td>train/approx_kl</td><td>0.01353</td></tr><tr><td>train/clip_fraction</td><td>0.20614</td></tr><tr><td>train/clip_range</td><td>0.2</td></tr><tr><td>train/entropy_loss</td><td>-1.30999</td></tr><tr><td>train/explained_variance</td><td>0.65612</td></tr><tr><td>train/learning_rate</td><td>0.0003</td></tr><tr><td>train/loss</td><td>44.55813</td></tr><tr><td>train/policy_gradient_loss</td><td>-0.01972</td></tr><tr><td>train/value_loss</td><td>212.05472</td></tr></table><br/></div></div>"
+       "<div class=\"wandb-row\"><div class=\"wandb-col\"><h3>Run history:</h3><br/><table class=\"wandb\"><tr><td>global_step</td><td>▁▃▆█</td></tr><tr><td>rollout/ep_len_mean</td><td>▁▃▅█</td></tr><tr><td>rollout/ep_rew_mean</td><td>▁▄▇█</td></tr><tr><td>time/fps</td><td>█▂▁▁</td></tr><tr><td>train/approx_kl</td><td>▁██</td></tr><tr><td>train/clip_fraction</td><td>▁▄█</td></tr><tr><td>train/clip_range</td><td>▁▁▁</td></tr><tr><td>train/entropy_loss</td><td>▁▄█</td></tr><tr><td>train/explained_variance</td><td>▁▇█</td></tr><tr><td>train/learning_rate</td><td>▁▁▁</td></tr><tr><td>train/loss</td><td>█▁▁</td></tr><tr><td>train/policy_gradient_loss</td><td>█▃▁</td></tr><tr><td>train/value_loss</td><td>█▂▁</td></tr></table><br/></div><div class=\"wandb-col\"><h3>Run summary:</h3><br/><table class=\"wandb\"><tr><td>global_step</td><td>131072</td></tr><tr><td>rollout/ep_len_mean</td><td>113.48</td></tr><tr><td>rollout/ep_rew_mean</td><td>-87.24881</td></tr><tr><td>time/fps</td><td>1031.0</td></tr><tr><td>train/approx_kl</td><td>0.01242</td></tr><tr><td>train/clip_fraction</td><td>0.16663</td></tr><tr><td>train/clip_range</td><td>0.2</td></tr><tr><td>train/entropy_loss</td><td>-1.30755</td></tr><tr><td>train/explained_variance</td><td>0.51275</td></tr><tr><td>train/learning_rate</td><td>0.0002</td></tr><tr><td>train/loss</td><td>66.06168</td></tr><tr><td>train/policy_gradient_loss</td><td>-0.01496</td></tr><tr><td>train/value_loss</td><td>257.38614</td></tr></table><br/></div></div>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
@@ -267,7 +365,7 @@
    {
     "data": {
      "text/html": [
-       "Synced <strong style=\"color:#cdcd00\">brisk-fire-2</strong>: <a href=\"https://wandb.ai/supersecurehuman/LunarLander-v2/runs/8czogswz\" target=\"_blank\">https://wandb.ai/supersecurehuman/LunarLander-v2/runs/8czogswz</a><br/>Synced 6 W&B file(s), 0 media file(s), 0 artifact file(s) and 1 other file(s)"
+       "Synced <strong style=\"color:#cdcd00\">warm-gorge-3</strong>: <a href=\"https://wandb.ai/supersecurehuman/LunarLander-v2/runs/2ovixu73\" target=\"_blank\">https://wandb.ai/supersecurehuman/LunarLander-v2/runs/2ovixu73</a><br/>Synced 6 W&B file(s), 0 media file(s), 0 artifact file(s) and 1 other file(s)"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
@@ -279,7 +377,7 @@
    {
     "data": {
      "text/html": [
-       "Find logs at: <code>./wandb/run-20220507_220654-8czogswz/logs</code>"
+       "Find logs at: <code>./wandb/run-20220508_062506-2ovixu73/logs</code>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
@@ -298,7 +396,7 @@
  },
  {
   "cell_type": "markdown",
-   "id": "3ffa0dae",
+   "id": "e9f1e6a5",
   "metadata": {},
   "source": [
    "### Note\n",
@@ -308,7 +406,288 @@
  },
  {
   "cell_type": "markdown",
-   "id": "a03b8746",
+   "id": "4f448887",
+   "metadata": {},
+   "source": [
+    "## Package to 🤗 hub"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "id": "f8d1b517",
+   "metadata": {
+    "ExecuteTime": {
+     "end_time": "2022-05-08T01:13:41.386029Z",
+     "start_time": "2022-05-08T01:13:41.335337Z"
+    }
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/plain": []
+     },
+     "execution_count": 10,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# You have to disable wandb while packaging it to hub, because it seems to be interfering with package to hub function.\n",
+    "wandb.init(mode=\"disabled\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "5f93f140",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from huggingface_hub import notebook_login # To log to our Hugging Face account to be able to upload models to the Hub."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "f0461e29",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Note: You just need to run notebook_login() once in any machine you are trying to login. The token is saved in you machine, making future access to your account easier\n",
+    "notebook_login()\n",
+    "!git config --global credential.helper store"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "id": "7d7ea1b3",
+   "metadata": {
+    "ExecuteTime": {
+     "end_time": "2022-05-08T01:14:35.254796Z",
+     "start_time": "2022-05-08T01:13:43.366135Z"
+    }
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\u001b[38;5;4mℹ This function will save, evaluate, generate a video of your agent,\n",
+      "create a model card and push everything to the hub. It might take up to 1min.\n",
+      "This is a work in progress: If you encounter a bug, please open an issue and use\n",
+      "push_to_hub instead.\u001b[0m\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/home/venom/miniconda3/envs/RL/lib/python3.7/site-packages/huggingface_hub/hf_api.py:82: FutureWarning: `name` and `organization` input arguments are deprecated and will be removed in v0.7. Pass `repo_id` instead.\n",
+      "  FutureWarning,\n",
+      "/home/venom/Desktop/deep-rl-class/unit1/unit1_bonus/hub/LunarLander_v2_PPO_wandb is already a clone of https://huggingface.co/SuperSecureHuman/LunarLander_v2_PPO_wandb. Make sure you pull the latest changes with `repo.git_pull()`.\n",
+      "/home/venom/miniconda3/envs/RL/lib/python3.7/site-packages/stable_baselines3/common/evaluation.py:69: UserWarning: Evaluation environment is not wrapped with a ``Monitor`` wrapper. This may result in reporting modified episode lengths and rewards, if other wrappers happen to modify these. Consider wrapping environment first with ``Monitor`` wrapper.\n",
+      "  UserWarning,\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Saving video to /home/venom/Desktop/deep-rl-class/unit1/unit1_bonus/-step-0-to-step-1000.mp4\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "ffmpeg version 4.2.2 Copyright (c) 2000-2019 the FFmpeg developers\n",
+      "  built with gcc 7.3.0 (crosstool-NG 1.23.0.449-a04d0)\n",
+      "  configuration: --prefix=/home/venom/miniconda3/envs/RL --cc=/tmp/build/80754af9/ffmpeg_1587154242452/_build_env/bin/x86_64-conda_cos6-linux-gnu-cc --disable-doc --enable-avresample --enable-gmp --enable-hardcoded-tables --enable-libfreetype --enable-libvpx --enable-pthreads --enable-libopus --enable-postproc --enable-pic --enable-pthreads --enable-shared --enable-static --enable-version3 --enable-zlib --enable-libmp3lame --disable-nonfree --enable-gpl --enable-gnutls --disable-openssl --enable-libopenh264 --enable-libx264\n",
+      "  libavutil      56. 31.100 / 56. 31.100\n",
+      "  libavcodec     58. 54.100 / 58. 54.100\n",
+      "  libavformat    58. 29.100 / 58. 29.100\n",
+      "  libavdevice    58.  8.100 / 58.  8.100\n",
+      "  libavfilter     7. 57.100 /  7. 57.100\n",
+      "  libavresample   4.  0.  0 /  4.  0.  0\n",
+      "  libswscale      5.  5.100 /  5.  5.100\n",
+      "  libswresample   3.  5.100 /  3.  5.100\n",
+      "  libpostproc    55.  5.100 / 55.  5.100\n",
+      "Input #0, mov,mp4,m4a,3gp,3g2,mj2, from './test.mp4':\n",
+      "  Metadata:\n",
+      "    major_brand     : isom\n",
+      "    minor_version   : 512\n",
+      "    compatible_brands: isomiso2avc1mp41\n",
+      "    encoder         : Lavf58.29.100\n",
+      "  Duration: 00:00:20.02, start: 0.000000, bitrate: 39 kb/s\n",
+      "    Stream #0:0(und): Video: h264 (High) (avc1 / 0x31637661), yuv420p, 600x400, 34 kb/s, 50 fps, 50 tbr, 12800 tbn, 100 tbc (default)\n",
+      "    Metadata:\n",
+      "      handler_name    : VideoHandler\n",
+      "Stream mapping:\n",
+      "  Stream #0:0 -> #0:0 (h264 (native) -> h264 (libx264))\n",
+      "Press [q] to stop, [?] for help\n",
+      "[libx264 @ 0x560e05024ec0] using cpu capabilities: MMX2 SSE2Fast SSSE3 SSE4.2 AVX FMA3 BMI2 AVX2 AVX512\n",
+      "[libx264 @ 0x560e05024ec0] profile High, level 3.1, 4:2:0, 8-bit\n",
+      "[libx264 @ 0x560e05024ec0] 264 - core 157 - H.264/MPEG-4 AVC codec - Copyleft 2003-2018 - http://www.videolan.org/x264.html - options: cabac=1 ref=3 deblock=1:0:0 analyse=0x3:0x113 me=hex subme=7 psy=1 psy_rd=1.00:0.00 mixed_ref=1 me_range=16 chroma_me=1 trellis=1 8x8dct=1 cqm=0 deadzone=21,11 fast_pskip=1 chroma_qp_offset=-2 threads=12 lookahead_threads=2 sliced_threads=0 nr=0 decimate=1 interlaced=0 bluray_compat=0 constrained_intra=0 bframes=3 b_pyramid=2 b_adapt=1 b_bias=0 direct=1 weightb=1 open_gop=0 weightp=2 keyint=250 keyint_min=25 scenecut=40 intra_refresh=0 rc_lookahead=40 rc=crf mbtree=1 crf=23.0 qcomp=0.60 qpmin=0 qpmax=69 qpstep=4 ip_ratio=1.40 aq=1:1.00\n",
+      "Output #0, mp4, to 'replay.mp4':\n",
+      "  Metadata:\n",
+      "    major_brand     : isom\n",
+      "    minor_version   : 512\n",
+      "    compatible_brands: isomiso2avc1mp41\n",
+      "    encoder         : Lavf58.29.100\n",
+      "    Stream #0:0(und): Video: h264 (libx264) (avc1 / 0x31637661), yuv420p, 600x400, q=-1--1, 50 fps, 12800 tbn, 50 tbc (default)\n",
+      "    Metadata:\n",
+      "      handler_name    : VideoHandler\n",
+      "      encoder         : Lavc58.54.100 libx264\n",
+      "    Side data:\n",
+      "      cpb: bitrate max/min/avg: 0/0/0 buffer size: 0 vbv_delay: -1\n",
+      "frame= 1001 fps=0.0 q=-1.0 Lsize=      94kB time=00:00:19.96 bitrate=  38.7kbits/s speed=27.4x    \n",
+      "video:82kB audio:0kB subtitle:0kB other streams:0kB global headers:0kB muxing overhead: 15.259376%\n",
+      "[libx264 @ 0x560e05024ec0] frame I:5     Avg QP:10.02  size:  1676\n",
+      "[libx264 @ 0x560e05024ec0] frame P:259   Avg QP:17.41  size:    99\n",
+      "[libx264 @ 0x560e05024ec0] frame B:737   Avg QP:20.72  size:    67\n",
+      "[libx264 @ 0x560e05024ec0] consecutive B-frames:  1.0%  1.8%  2.1% 95.1%\n",
+      "[libx264 @ 0x560e05024ec0] mb I  I16..4: 87.6%  7.3%  5.0%\n",
+      "[libx264 @ 0x560e05024ec0] mb P  I16..4:  0.1%  0.3%  0.1%  P16..4:  0.9%  0.1%  0.0%  0.0%  0.0%    skip:98.5%\n",
+      "[libx264 @ 0x560e05024ec0] mb B  I16..4:  0.0%  0.0%  0.1%  B16..8:  1.2%  0.1%  0.0%  direct: 0.0%  skip:98.6%  L0:57.8% L1:41.6% BI: 0.5%\n",
+      "[libx264 @ 0x560e05024ec0] 8x8 transform intra:17.5% inter:12.1%\n",
+      "[libx264 @ 0x560e05024ec0] coded y,uvDC,uvAC intra: 6.9% 9.7% 9.3% inter: 0.1% 0.1% 0.0%\n",
+      "[libx264 @ 0x560e05024ec0] i16 v,h,dc,p: 89%  5%  6%  0%\n",
+      "[libx264 @ 0x560e05024ec0] i8 v,h,dc,ddl,ddr,vr,hd,vl,hu: 26%  8% 65%  0%  0%  0%  0%  0%  0%\n",
+      "[libx264 @ 0x560e05024ec0] i4 v,h,dc,ddl,ddr,vr,hd,vl,hu: 13% 14% 60%  2%  2%  2%  3%  2%  3%\n",
+      "[libx264 @ 0x560e05024ec0] i8c dc,h,v,p: 96%  3%  2%  0%\n",
+      "[libx264 @ 0x560e05024ec0] Weighted P-Frames: Y:0.0% UV:0.0%\n",
+      "[libx264 @ 0x560e05024ec0] ref P L0: 76.2%  0.8% 16.4%  6.6%\n",
+      "[libx264 @ 0x560e05024ec0] ref B L0: 62.0% 34.4%  3.7%\n",
+      "[libx264 @ 0x560e05024ec0] ref B L1: 94.1%  5.9%\n",
+      "[libx264 @ 0x560e05024ec0] kb/s:33.21\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\u001b[38;5;4mℹ Pushing repo LunarLander_v2_PPO_wandb to the Hugging Face Hub\u001b[0m\n"
+     ]
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "ee4b1a1441da4bff8a0a30cbfaa79d54",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Upload file PPO-LunarLander-v2.zip:  23%|##2       | 32.0k/141k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "ea5e56decd7142dea38707f5b56eede1",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Upload file PPO-LunarLander-v2/policy.optimizer.pth:  39%|###8      | 32.0k/82.8k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "e716bdab138e4b9cb10d30387ba16953",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Upload file PPO-LunarLander-v2/policy.pth:  76%|#######5  | 32.0k/42.2k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "b966e0bc19604640b3eb0cea62265631",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Upload file replay.mp4:  34%|###3      | 32.0k/94.3k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "d357e49f80d94c569864c2daca4974e5",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Upload file PPO-LunarLander-v2/pytorch_variables.pth: 100%|##########| 431/431 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "remote: Enforcing permissions...        \n",
+      "remote: Allowed refs: all        \n",
+      "To https://huggingface.co/SuperSecureHuman/LunarLander_v2_PPO_wandb\n",
+      "   b5f588e..67fd722  main -> main\n",
+      "\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\u001b[38;5;4mℹ Your model is pushed to the hub. You can view your model here:\n",
+      "https://huggingface.co/SuperSecureHuman/LunarLander_v2_PPO_wandb\u001b[0m\n"
+     ]
+    }
+   ],
+   "source": [
+    "from huggingface_sb3 import package_to_hub\n",
+    "\n",
+    "env_id = config[\"env_name\"]\n",
+    "\n",
+    "model_architecture = \"PPO\"\n",
+    "model_name = \"PPO-LunarLander-v2\"\n",
+    "\n",
+    "repo_id = \"SuperSecureHuman/LunarLander_v2_PPO_wandb\"\n",
+    "\n",
+    "commit_message = \"Initial Commit\"\n",
+    "\n",
+    "eval_env = DummyVecEnv([lambda: gym.make(env_id)])\n",
+    "\n",
+    "package_to_hub(model=model, # Our trained model\n",
+    "               model_name=model_name, # The name of our trained model \n",
+    "               model_architecture=model_architecture, # The model architecture we used: in our case PPO\n",
+    "               env_id=env_id, # Name of the environment\n",
+    "               eval_env=eval_env, # Evaluation Environment\n",
+    "               repo_id=repo_id, # id of the model repository from the Hugging Face Hub\n",
+    "               commit_message=commit_message)\n",
+    "eval_env.close()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "9368a9f9",
   "metadata": {},
   "source": [
    "## Congarts!\n",