Recompute image normalization mean and std

Sylvain Le Groux · Sylvain Le Groux · commit b9aab5131f88 · 2025-02-10T20:47:42.000-08:00
diff --git a/config/data/image/tiny_imagenet.yaml b/config/data/image/tiny_imagenet.yaml
@@ -11,8 +11,10 @@ transforms:
   transforms:
     - _target_: torchvision.transforms.ToTensor
     - _target_: torchvision.transforms.Normalize
-      mean: [0.4822, 0.4495, 0.3985]
-      std: [0.2771, 0.2690, 0.2826]
+      mean: [0.4822, 0.4494, 0.3978]
+      std: [0.2754, 0.2679, 0.2811]
+      # previous mean: [0.4822, 0.4495, 0.3985]
+      # previous std: [0.2771, 0.2690, 0.2826]
     # - _target_: torchvision.transforms.Resize
     #   size: [32,32]
 
diff --git a/config/data/image/tiny_imagenet_aug.yaml b/config/data/image/tiny_imagenet_aug.yaml
@@ -11,8 +11,8 @@ transforms:
   transforms:
     - _target_: torchvision.transforms.ToTensor
     - _target_: torchvision.transforms.Normalize
-      mean: [0.4822, 0.4495, 0.3985]
-      std: [0.2771, 0.2690, 0.2826]
+      mean: [0.4822, 0.4494, 0.3978]
+      std: [0.2754, 0.2679, 0.2811]
     - _target_: torchvision.transforms.Resize
       size: 64
     - _target_: torchvision.transforms.RandomCrop
diff --git a/nbs/image.datasets.ipynb b/nbs/image.datasets.ipynb
@@ -23,16 +23,7 @@
    "cell_type": "code",
    "execution_count": null,
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "The autoreload extension is already loaded. To reload it, use:\n",
-      "  %reload_ext autoreload\n"
-     ]
-    }
-   ],
+   "outputs": [],
    "source": [
     "#| hide\n",
     "%load_ext autoreload\n",
@@ -462,7 +453,100 @@
     "        n_rows:int=3, # Number of rows in the grid\n",
     "        n_cols:int=3 # Number of columns in the grid\n",
     "        ):\n",
-    "        self.plot_grid(self, n_rows, n_cols, self.hf_ds.features['label'].int2str)"
+    "        self.plot_grid(self, n_rows, n_cols, self.hf_ds.features['label'].int2str)\n",
+    "    \n",
+    "    def compute_image_normalization(self):\n",
+    "        \"\"\"Return (mean, std) of one full-dataset batch, reduced over dims 0, 2 and 3.\"\"\"\n",
+    "        loader = DataLoader(self, batch_size=len(self))  # batch_size=len(self): a single batch\n",
+    "        images = next(iter(loader))[0].float()  # presumably (N, C, H, W) images - TODO confirm\n",
+    "        reduce_dims = [0, 2, 3]  # every dim except dim 1 is reduced\n",
+    "        return images.mean(reduce_dims), images.std(reduce_dims)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Image normalization\n",
+    "If both the train and validation splits are available, compute the normalization statistics from both; otherwise use the train split only.\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "[16:22:46] INFO - loading dataset slegroux/tiny-imagenet-200-clean with args () from split train\n",
+      "[16:22:46] INFO - loading dataset slegroux/tiny-imagenet-200-clean from split train\n",
+      "Overwrite dataset info from restored data version if exists.\n",
+      "[16:22:48] INFO - Overwrite dataset info from restored data version if exists.\n",
+      "Loading Dataset info from ../data/image/slegroux___tiny-imagenet-200-clean/default/0.0.0/4b908d89fab3eb36aa8ebcd41c1996b28da7d6f2\n",
+      "[16:22:48] INFO - Loading Dataset info from ../data/image/slegroux___tiny-imagenet-200-clean/default/0.0.0/4b908d89fab3eb36aa8ebcd41c1996b28da7d6f2\n",
+      "Found cached dataset tiny-imagenet-200-clean (/user/s/slegroux/Projects/nimrod/nbs/../data/image/slegroux___tiny-imagenet-200-clean/default/0.0.0/4b908d89fab3eb36aa8ebcd41c1996b28da7d6f2)\n",
+      "[16:22:48] INFO - Found cached dataset tiny-imagenet-200-clean (/user/s/slegroux/Projects/nimrod/nbs/../data/image/slegroux___tiny-imagenet-200-clean/default/0.0.0/4b908d89fab3eb36aa8ebcd41c1996b28da7d6f2)\n",
+      "Loading Dataset info from /user/s/slegroux/Projects/nimrod/nbs/../data/image/slegroux___tiny-imagenet-200-clean/default/0.0.0/4b908d89fab3eb36aa8ebcd41c1996b28da7d6f2\n",
+      "[16:22:48] INFO - Loading Dataset info from /user/s/slegroux/Projects/nimrod/nbs/../data/image/slegroux___tiny-imagenet-200-clean/default/0.0.0/4b908d89fab3eb36aa8ebcd41c1996b28da7d6f2\n",
+      "[16:23:04] INFO - loading dataset slegroux/tiny-imagenet-200-clean with args () from split validation\n",
+      "[16:23:04] INFO - loading dataset slegroux/tiny-imagenet-200-clean from split validation\n",
+      "Overwrite dataset info from restored data version if exists.\n",
+      "[16:23:05] INFO - Overwrite dataset info from restored data version if exists.\n",
+      "Loading Dataset info from ../data/image/slegroux___tiny-imagenet-200-clean/default/0.0.0/4b908d89fab3eb36aa8ebcd41c1996b28da7d6f2\n",
+      "[16:23:05] INFO - Loading Dataset info from ../data/image/slegroux___tiny-imagenet-200-clean/default/0.0.0/4b908d89fab3eb36aa8ebcd41c1996b28da7d6f2\n",
+      "Found cached dataset tiny-imagenet-200-clean (/user/s/slegroux/Projects/nimrod/nbs/../data/image/slegroux___tiny-imagenet-200-clean/default/0.0.0/4b908d89fab3eb36aa8ebcd41c1996b28da7d6f2)\n",
+      "[16:23:05] INFO - Found cached dataset tiny-imagenet-200-clean (/user/s/slegroux/Projects/nimrod/nbs/../data/image/slegroux___tiny-imagenet-200-clean/default/0.0.0/4b908d89fab3eb36aa8ebcd41c1996b28da7d6f2)\n",
+      "Loading Dataset info from /user/s/slegroux/Projects/nimrod/nbs/../data/image/slegroux___tiny-imagenet-200-clean/default/0.0.0/4b908d89fab3eb36aa8ebcd41c1996b28da7d6f2\n",
+      "[16:23:05] INFO - Loading Dataset info from /user/s/slegroux/Projects/nimrod/nbs/../data/image/slegroux___tiny-imagenet-200-clean/default/0.0.0/4b908d89fab3eb36aa8ebcd41c1996b28da7d6f2\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<pre style=\"white-space:pre;overflow-x:auto;line-height:normal;font-family:Menlo,'DejaVu Sans Mono',consolas,'Courier New',monospace\">mean:<span style=\"color: #800080; text-decoration-color: #800080; font-weight: bold\">tensor</span><span style=\"font-weight: bold\">([</span><span style=\"color: #008080; text-decoration-color: #008080; font-weight: bold\">0.4822</span>, <span style=\"color: #008080; text-decoration-color: #008080; font-weight: bold\">0.4494</span>, <span style=\"color: #008080; text-decoration-color: #008080; font-weight: bold\">0.3978</span><span style=\"font-weight: bold\">])</span>, std: <span style=\"color: #800080; text-decoration-color: #800080; font-weight: bold\">tensor</span><span style=\"font-weight: bold\">([</span><span style=\"color: #008080; text-decoration-color: #008080; font-weight: bold\">0.2754</span>, <span style=\"color: #008080; text-decoration-color: #008080; font-weight: bold\">0.2679</span>, <span style=\"color: #008080; text-decoration-color: #008080; font-weight: bold\">0.2811</span><span style=\"font-weight: bold\">])</span>\n",
+       "</pre>\n"
+      ],
+      "text/plain": [
+       "mean:\u001b[1;35mtensor\u001b[0m\u001b[1m(\u001b[0m\u001b[1m[\u001b[0m\u001b[1;36m0.4822\u001b[0m, \u001b[1;36m0.4494\u001b[0m, \u001b[1;36m0.3978\u001b[0m\u001b[1m]\u001b[0m\u001b[1m)\u001b[0m, std: \u001b[1;35mtensor\u001b[0m\u001b[1m(\u001b[0m\u001b[1m[\u001b[0m\u001b[1;36m0.2754\u001b[0m, \u001b[1;36m0.2679\u001b[0m, \u001b[1;36m0.2811\u001b[0m\u001b[1m]\u001b[0m\u001b[1m)\u001b[0m\n"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "#| export\n",
+    "\n",
+    "def normalize_image_datasets(name, data_dir='../data/image', splits=('train', 'validation')):\n",
+    "    \"\"\"Average the per-split image normalization statistics of a dataset.\n",
+    "\n",
+    "    Builds ImageDataset(name=name, data_dir=data_dir, split=split) for each entry of\n",
+    "    `splits`, calls compute_image_normalization() on it, and returns (mean, std): the\n",
+    "    element-wise average of the per-split means and of the per-split stds. Splits are\n",
+    "    weighted equally whatever their size; std is a mean of stds, not a pooled std.\n",
+    "    `splits` defaults to an immutable tuple so the default cannot be mutated by callers.\n",
+    "    \"\"\"\n",
+    "    per_split = [\n",
+    "        ImageDataset(name=name, data_dir=data_dir, split=split).compute_image_normalization()\n",
+    "        for split in splits\n",
+    "    ]\n",
+    "    mean = torch.stack([m for m, _ in per_split]).mean(dim=0)\n",
+    "    std = torch.stack([s for _, s in per_split]).mean(dim=0)\n",
+    "    return mean, std"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "#| notest\n",
+    "\n",
+    "mean, std = normalize_image_datasets('slegroux/tiny-imagenet-200-clean')  # data_dir and splits left at their defaults\n",
+    "print(f\"mean:{mean}, std: {std}\")"
    ]
   },
   {
diff --git a/nimrod/_modidx.py b/nimrod/_modidx.py
@@ -195,6 +195,8 @@
                                                                                         'nimrod/image/datasets.py'),
                                        'nimrod.image.datasets.ImageDataset.__len__': ( 'image.datasets.html#imagedataset.__len__',
                                                                                        'nimrod/image/datasets.py'),
+                                       'nimrod.image.datasets.ImageDataset.compute_image_normalization': ( 'image.datasets.html#imagedataset.compute_image_normalization',
+                                                                                                           'nimrod/image/datasets.py'),
                                        'nimrod.image.datasets.ImageDataset.dim': ( 'image.datasets.html#imagedataset.dim',
                                                                                    'nimrod/image/datasets.py'),
                                        'nimrod.image.datasets.ImageDataset.int2str': ( 'image.datasets.html#imagedataset.int2str',
@@ -232,6 +234,8 @@
                                        'nimrod.image.datasets.ImageSuperResDataset.__init__': ( 'image.datasets.html#imagesuperresdataset.__init__',
                                                                                                 'nimrod/image/datasets.py'),
                                        'nimrod.image.datasets.make_grid': ('image.datasets.html#make_grid', 'nimrod/image/datasets.py'),
+                                       'nimrod.image.datasets.normalize_image_datasets': ( 'image.datasets.html#normalize_image_datasets',
+                                                                                           'nimrod/image/datasets.py'),
                                        'nimrod.image.datasets.show_images': ( 'image.datasets.html#show_images',
                                                                               'nimrod/image/datasets.py')},
             'nimrod.image.med': { 'nimrod.image.med.BertAttention': ('image.med.html#bertattention', 'nimrod/image/med.py'),
diff --git a/nimrod/image/datasets.py b/nimrod/image/datasets.py
@@ -3,8 +3,8 @@
 # AUTOGENERATED! DO NOT EDIT! File to edit: ../../nbs/image.datasets.ipynb.
 
 # %% auto 0
-__all__ = ['logger', 'TFM_LOW_RES', 'show_images', 'make_grid', 'ImagePlotMixin', 'ImageDataset', 'ImageDataModule',
-           'ImageSuperResDataset', 'ImageSuperResDataModule']
+__all__ = ['logger', 'TFM_LOW_RES', 'show_images', 'make_grid', 'ImagePlotMixin', 'ImageDataset', 'normalize_image_datasets',
+           'ImageDataModule', 'ImageSuperResDataset', 'ImageSuperResDataModule']
 
 # %% ../../nbs/image.datasets.ipynb 3
 # torch
@@ -346,8 +346,33 @@ def show_grid(
         n_cols:int=3 # Number of columns in the grid
         ):
         self.plot_grid(self, n_rows, n_cols, self.hf_ds.features['label'].int2str)
+    
+    def compute_image_normalization(self):
+        """Return (mean, std) of one full-dataset batch, reduced over dims 0, 2 and 3."""
+        loader = DataLoader(self, batch_size=len(self))  # batch_size=len(self): a single batch
+        images = next(iter(loader))[0].float()  # presumably (N, C, H, W) images - TODO confirm
+        reduce_dims = [0, 2, 3]  # every dim except dim 1 is reduced
+        return images.mean(reduce_dims), images.std(reduce_dims)
 
 # %% ../../nbs/image.datasets.ipynb 12
+def normalize_image_datasets(name, data_dir='../data/image', splits=('train', 'validation')):
+    """Average the per-split image normalization statistics of a dataset.
+
+    Builds ImageDataset(name=name, data_dir=data_dir, split=split) for each entry of
+    `splits`, calls compute_image_normalization() on it, and returns (mean, std): the
+    element-wise average of the per-split means and of the per-split stds. Splits are
+    weighted equally whatever their size; std is a mean of stds, not a pooled std.
+    `splits` defaults to an immutable tuple so the default cannot be mutated by callers.
+    """
+    per_split = [
+        ImageDataset(name=name, data_dir=data_dir, split=split).compute_image_normalization()
+        for split in splits
+    ]
+    mean = torch.stack([m for m, _ in per_split]).mean(dim=0)
+    std = torch.stack([s for _, s in per_split]).mean(dim=0)
+    return mean, std
+
+# %% ../../nbs/image.datasets.ipynb 15
 class ImageDataModule(ImagePlotMixin, DataModule):
 
     def __init__(
@@ -510,7 +535,7 @@ def show_batch(
         return grid_im
 
 
-# %% ../../nbs/image.datasets.ipynb 23
+# %% ../../nbs/image.datasets.ipynb 26
 TFM_LOW_RES = transforms.Compose(
     [
         transforms.Resize((32, 32), antialias=True), 
@@ -549,7 +574,7 @@ def __getitem__(self, idx:int) -> Tuple[torch.FloatTensor, torch.FloatTensor]:
         return image_x, image_y
         
 
-# %% ../../nbs/image.datasets.ipynb 27
+# %% ../../nbs/image.datasets.ipynb 30
 TFM_LOW_RES = nn.Sequential(
     transforms.Resize((32, 32), antialias=True),
     transforms.Resize((64, 64), antialias=True)
diff --git a/tutorials/tiny_imagenet.ipynb b/tutorials/tiny_imagenet.ipynb