|
2 | 2 | "cells": [
|
3 | 3 | {
|
4 | 4 | "cell_type": "code",
|
5 |
| - "execution_count": 19, |
| 5 | + "execution_count": 1, |
6 | 6 | "id": "08a04217-5d99-41e2-b2b3-31c286a26936",
|
7 | 7 | "metadata": {},
|
8 |
| - "outputs": [ |
9 |
| - { |
10 |
| - "name": "stdout", |
11 |
| - "output_type": "stream", |
12 |
| - "text": [ |
13 |
| - "The autoreload extension is already loaded. To reload it, use:\n", |
14 |
| - " %reload_ext autoreload\n" |
15 |
| - ] |
16 |
| - } |
17 |
| - ], |
| 8 | + "outputs": [], |
18 | 9 | "source": [
|
19 | 10 | "import geopandas as gpd\n",
|
20 | 11 | "import pandas as pd\n",
|
|
114 | 105 | },
|
115 | 106 | {
|
116 | 107 | "cell_type": "code",
|
117 |
| - "execution_count": 8, |
| 108 | + "execution_count": 5, |
118 | 109 | "id": "12ecddb4-8a5b-48e0-9281-f0d128740222",
|
119 | 110 | "metadata": {},
|
120 | 111 | "outputs": [
|
121 | 112 | {
|
122 | 113 | "name": "stderr",
|
123 | 114 | "output_type": "stream",
|
124 | 115 | "text": [
|
125 |
| - "\u001b[32m2024-06-03 21:59:01.002\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m98\u001b[0m - \u001b[1musing embeddings found in metadata file\u001b[0m\n", |
126 |
| - "\u001b[32m2024-06-03 21:59:01.004\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m111\u001b[0m - \u001b[1mread train split with 72268 chip files (out of 72268)\u001b[0m\n", |
127 |
| - "\u001b[32m2024-06-03 21:59:01.004\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m115\u001b[0m - \u001b[1mremoving chip IDs with no associated neighbors .npy files\u001b[0m\n", |
128 |
| - "\u001b[32m2024-06-03 21:59:01.447\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m123\u001b[0m - \u001b[1mmax cache size is -1\u001b[0m\n", |
129 |
| - "\u001b[32m2024-06-03 21:59:02.923\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m98\u001b[0m - \u001b[1musing embeddings found in metadata file\u001b[0m\n", |
130 |
| - "\u001b[32m2024-06-03 21:59:02.925\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m111\u001b[0m - \u001b[1mread val split with 14770 chip files (out of 14770)\u001b[0m\n", |
131 |
| - "\u001b[32m2024-06-03 21:59:02.926\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m115\u001b[0m - \u001b[1mremoving chip IDs with no associated neighbors .npy files\u001b[0m\n", |
132 |
| - "\u001b[32m2024-06-03 21:59:03.333\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m123\u001b[0m - \u001b[1mmax cache size is -1\u001b[0m\n", |
133 |
| - "\u001b[32m2024-06-03 21:59:04.614\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m98\u001b[0m - \u001b[1musing embeddings found in metadata file\u001b[0m\n", |
134 |
| - "\u001b[32m2024-06-03 21:59:04.617\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m111\u001b[0m - \u001b[1mread test split with 17202 chip files (out of 17202)\u001b[0m\n", |
135 |
| - "\u001b[32m2024-06-03 21:59:04.617\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m115\u001b[0m - \u001b[1mremoving chip IDs with no associated neighbors .npy files\u001b[0m\n", |
136 |
| - "\u001b[32m2024-06-03 21:59:05.033\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m123\u001b[0m - \u001b[1mmax cache size is -1\u001b[0m\n", |
137 |
| - "\u001b[32m2024-06-03 21:59:05.035\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.chipmultilabel\u001b[0m:\u001b[36mcompute\u001b[0m:\u001b[36m41\u001b[0m - \u001b[1mreading means and stddevs from /opt/data/california-naip-chips/california-naip-chips-100k_metadata_embeddings_meansstdevs.pkl\u001b[0m\n" |
| 116 | + "\u001b[32m2024-06-04 17:10:23.099\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m100\u001b[0m - \u001b[1musing embeddings found in metadata file\u001b[0m\n", |
| 117 | + "\u001b[32m2024-06-04 17:10:23.101\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m113\u001b[0m - \u001b[1mread train split with 72268 chip files (out of 72268)\u001b[0m\n", |
| 118 | + "\u001b[32m2024-06-04 17:10:23.101\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m117\u001b[0m - \u001b[1mremoving chip IDs with no associated neighbors .npy files\u001b[0m\n", |
| 119 | + "\u001b[32m2024-06-04 17:10:23.523\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m125\u001b[0m - \u001b[1mmax cache size is -1\u001b[0m\n", |
| 120 | + "\u001b[32m2024-06-04 17:10:24.827\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m100\u001b[0m - \u001b[1musing embeddings found in metadata file\u001b[0m\n", |
| 121 | + "\u001b[32m2024-06-04 17:10:24.830\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m113\u001b[0m - \u001b[1mread val split with 14770 chip files (out of 14770)\u001b[0m\n", |
| 122 | + "\u001b[32m2024-06-04 17:10:24.830\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m117\u001b[0m - \u001b[1mremoving chip IDs with no associated neighbors .npy files\u001b[0m\n", |
| 123 | + "\u001b[32m2024-06-04 17:10:25.228\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m125\u001b[0m - \u001b[1mmax cache size is -1\u001b[0m\n", |
| 124 | + "\u001b[32m2024-06-04 17:10:26.502\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m100\u001b[0m - \u001b[1musing embeddings found in metadata file\u001b[0m\n", |
| 125 | + "\u001b[32m2024-06-04 17:10:26.505\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m113\u001b[0m - \u001b[1mread test split with 17202 chip files (out of 17202)\u001b[0m\n", |
| 126 | + "\u001b[32m2024-06-04 17:10:26.505\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m117\u001b[0m - \u001b[1mremoving chip IDs with no associated neighbors .npy files\u001b[0m\n", |
| 127 | + "\u001b[32m2024-06-04 17:10:26.908\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m125\u001b[0m - \u001b[1mmax cache size is -1\u001b[0m\n", |
| 128 | + "\u001b[32m2024-06-04 17:10:26.910\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.chipmultilabel\u001b[0m:\u001b[36mcompute\u001b[0m:\u001b[36m41\u001b[0m - \u001b[1mreading means and stddevs from /opt/data/california-naip-chips/california-naip-chips-100k_metadata_embeddings_meansstdevs.pkl\u001b[0m\n" |
138 | 129 | ]
|
139 | 130 | }
|
140 | 131 | ],
|
|
147 | 138 | },
|
148 | 139 | {
|
149 | 140 | "cell_type": "code",
|
150 |
| - "execution_count": 12, |
| 141 | + "execution_count": 6, |
151 | 142 | "id": "5fa5944f-b902-4fab-a017-19b7e020b903",
|
152 | 143 | "metadata": {},
|
153 | 144 | "outputs": [
|
|
157 | 148 | "(17, 17, 768)"
|
158 | 149 | ]
|
159 | 150 | },
|
160 |
| - "execution_count": 12, |
| 151 | + "execution_count": 6, |
161 | 152 | "metadata": {},
|
162 | 153 | "output_type": "execute_result"
|
163 | 154 | }
|
|
184 | 175 | },
|
185 | 176 | {
|
186 | 177 | "cell_type": "code",
|
187 |
| - "execution_count": 15, |
| 178 | + "execution_count": 7, |
188 | 179 | "id": "a85712fa-17f0-4690-a0c2-487be97ea799",
|
189 | 180 | "metadata": {},
|
190 | 181 | "outputs": [],
|
|
194 | 185 | },
|
195 | 186 | {
|
196 | 187 | "cell_type": "code",
|
197 |
| - "execution_count": 16, |
| 188 | + "execution_count": 8, |
198 | 189 | "id": "3fa30ac9-0376-4494-b048-19f8ffc0d41f",
|
199 | 190 | "metadata": {},
|
200 | 191 | "outputs": [],
|
|
204 | 195 | },
|
205 | 196 | {
|
206 | 197 | "cell_type": "code",
|
207 |
| - "execution_count": 18, |
| 198 | + "execution_count": 9, |
208 | 199 | "id": "4ff9295c-4ff8-4b31-9465-70a03ff23b51",
|
209 | 200 | "metadata": {},
|
210 | 201 | "outputs": [
|
|
214 | 205 | "torch.Size([16, 17, 17, 768])"
|
215 | 206 | ]
|
216 | 207 | },
|
217 |
| - "execution_count": 18, |
| 208 | + "execution_count": 9, |
| 209 | + "metadata": {}, |
| 210 | + "output_type": "execute_result" |
| 211 | + } |
| 212 | + ], |
| 213 | + "source": [ |
| 214 | + "batch['embedding'].shape" |
| 215 | + ] |
| 216 | + }, |
| 217 | + { |
| 218 | + "cell_type": "markdown", |
| 219 | + "id": "a75faa90-5b40-4c8f-be84-376b6893b0fd", |
| 220 | + "metadata": {}, |
| 221 | + "source": [ |
| 222 | + "---" |
| 223 | + ] |
| 224 | + }, |
| 225 | + { |
| 226 | + "cell_type": "markdown", |
| 227 | + "id": "ec2a0ec5-ab77-4712-bd15-dc7bb561300d", |
| 228 | + "metadata": {}, |
| 229 | + "source": [ |
| 230 | + "smaller neighborhood radius" |
| 231 | + ] |
| 232 | + }, |
| 233 | + { |
| 234 | + "cell_type": "code", |
| 235 | + "execution_count": 10, |
| 236 | + "id": "ad97b784-56bd-497e-9f41-107887db6499", |
| 237 | + "metadata": {}, |
| 238 | + "outputs": [ |
| 239 | + { |
| 240 | + "name": "stderr", |
| 241 | + "output_type": "stream", |
| 242 | + "text": [ |
| 243 | + "\u001b[32m2024-06-04 17:11:50.681\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m100\u001b[0m - \u001b[1musing embeddings found in metadata file\u001b[0m\n", |
| 244 | + "\u001b[32m2024-06-04 17:11:50.684\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m113\u001b[0m - \u001b[1mread train split with 72268 chip files (out of 72268)\u001b[0m\n", |
| 245 | + "\u001b[32m2024-06-04 17:11:50.684\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m117\u001b[0m - \u001b[1mremoving chip IDs with no associated neighbors .npy files\u001b[0m\n", |
| 246 | + "\u001b[32m2024-06-04 17:11:51.103\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m125\u001b[0m - \u001b[1mmax cache size is -1\u001b[0m\n", |
| 247 | + "\u001b[32m2024-06-04 17:11:52.474\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m100\u001b[0m - \u001b[1musing embeddings found in metadata file\u001b[0m\n", |
| 248 | + "\u001b[32m2024-06-04 17:11:52.478\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m113\u001b[0m - \u001b[1mread val split with 14770 chip files (out of 14770)\u001b[0m\n", |
| 249 | + "\u001b[32m2024-06-04 17:11:52.478\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m117\u001b[0m - \u001b[1mremoving chip IDs with no associated neighbors .npy files\u001b[0m\n", |
| 250 | + "\u001b[32m2024-06-04 17:11:52.876\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m125\u001b[0m - \u001b[1mmax cache size is -1\u001b[0m\n", |
| 251 | + "\u001b[32m2024-06-04 17:11:54.286\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m100\u001b[0m - \u001b[1musing embeddings found in metadata file\u001b[0m\n", |
| 252 | + "\u001b[32m2024-06-04 17:11:54.289\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m113\u001b[0m - \u001b[1mread test split with 17202 chip files (out of 17202)\u001b[0m\n", |
| 253 | + "\u001b[32m2024-06-04 17:11:54.290\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m117\u001b[0m - \u001b[1mremoving chip IDs with no associated neighbors .npy files\u001b[0m\n", |
| 254 | + "\u001b[32m2024-06-04 17:11:54.694\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.components.chipmultilabel\u001b[0m:\u001b[36m__init__\u001b[0m:\u001b[36m125\u001b[0m - \u001b[1mmax cache size is -1\u001b[0m\n", |
| 255 | + "\u001b[32m2024-06-04 17:11:54.697\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mearthtext.datamodules.chipmultilabel\u001b[0m:\u001b[36mcompute\u001b[0m:\u001b[36m41\u001b[0m - \u001b[1mreading means and stddevs from /opt/data/california-naip-chips/california-naip-chips-100k_metadata_embeddings_meansstdevs.pkl\u001b[0m\n" |
| 256 | + ] |
| 257 | + } |
| 258 | + ], |
| 259 | + "source": [ |
| 260 | + "conf.dataloader.neighborhood_radius = 5\n", |
| 261 | + "dl = hydra.utils.instantiate(conf.dataloader)" |
| 262 | + ] |
| 263 | + }, |
| 264 | + { |
| 265 | + "cell_type": "code", |
| 266 | + "execution_count": 11, |
| 267 | + "id": "7765d322-4822-43fb-a8cf-9cf8a6741b7b", |
| 268 | + "metadata": {}, |
| 269 | + "outputs": [ |
| 270 | + { |
| 271 | + "data": { |
| 272 | + "text/plain": [ |
| 273 | + "(11, 11, 768)" |
| 274 | + ] |
| 275 | + }, |
| 276 | + "execution_count": 11, |
| 277 | + "metadata": {}, |
| 278 | + "output_type": "execute_result" |
| 279 | + } |
| 280 | + ], |
| 281 | + "source": [ |
| 282 | + "dl.train_dataset[0]['embedding'].shape" |
| 283 | + ] |
| 284 | + }, |
| 285 | + { |
| 286 | + "cell_type": "code", |
| 287 | + "execution_count": 12, |
| 288 | + "id": "c27ef4fe-0bd6-453a-bbb6-43e273a87cf2", |
| 289 | + "metadata": {}, |
| 290 | + "outputs": [ |
| 291 | + { |
| 292 | + "data": { |
| 293 | + "text/plain": [ |
| 294 | + "torch.Size([16, 11, 11, 768])" |
| 295 | + ] |
| 296 | + }, |
| 297 | + "execution_count": 12, |
218 | 298 | "metadata": {},
|
219 | 299 | "output_type": "execute_result"
|
220 | 300 | }
|
221 | 301 | ],
|
222 | 302 | "source": [
|
| 303 | + "dltrain = dl.train_dataloader()\n", |
| 304 | + "batch = next(iter(dltrain))\n", |
223 | 305 | "batch['embedding'].shape"
|
224 | 306 | ]
|
225 | 307 | }
|
|
0 commit comments