|
1180 | 1180 | "metadata": {}, |
1181 | 1181 | "outputs": [], |
1182 | 1182 | "source": [ |
1183 | | - "begin = datetime.strptime(\"05/06/20 16:30\", \"%d/%m/%y %H:%M\")\n", |
1184 | | - "end = datetime.strptime(\"15/06/21 16:30\", \"%d/%m/%y %H:%M\")\n", |
| 1183 | + "begin = datetime.strptime(\"20-07-31 20:30\", \"%y-%m-%d %H:%M\")\n", |
| 1184 | + "end = datetime.strptime(\"21-07-31 20:30\", \"%y-%m-%d %H:%M\")\n", |
1185 | 1185 | "\n", |
1186 | 1186 | "begin_utc = pytz.utc.localize(begin)\n", |
1187 | 1187 | "end_utc = pytz.utc.localize(end)" |
|
1200 | 1200 | "metadata": {}, |
1201 | 1201 | "outputs": [], |
1202 | 1202 | "source": [ |
1203 | | - "begin = datetime.strptime(\"05/06/20 16:30\", \"%d/%m/%y %H:%M\")\n", |
1204 | | - "end = datetime.strptime(\"10/06/21 16:30\", \"%d/%m/%y %H:%M\")\n", |
| 1203 | + "begin = datetime.strptime(\"20-07-31 20:30\", \"%y-%m-%d %H:%M\")\n", |
| 1204 | + "end = datetime.strptime(\"21-07-31 20:30\", \"%y-%m-%d %H:%M\")\n", |
1205 | 1205 | "\n", |
1206 | 1206 | "timezone = pytz.timezone(\"America/Los_Angeles\")\n", |
1207 | 1207 | "\n", |
1208 | 1208 | "begin_Los_Angeles = timezone.localize(begin)\n", |
1209 | 1209 | "end_Los_Angeles = timezone.localize(end)" |
1210 | 1210 | ] |
1211 | 1211 | }, |
1212 | | - { |
1213 | | - "cell_type": "code", |
1214 | | - "execution_count": 21, |
1215 | | - "metadata": {}, |
1216 | | - "outputs": [ |
1217 | | - { |
1218 | | - "name": "stdout", |
1219 | | - "output_type": "stream", |
1220 | | - "text": [ |
1221 | | - "2020-06-05 16:30:00+00:00\n", |
1222 | | - "2021-06-15 16:30:00+00:00\n", |
1223 | | - "2020-06-05 16:30:00-07:00\n", |
1224 | | - "2021-06-10 16:30:00-07:00\n" |
1225 | | - ] |
1226 | | - } |
1227 | | - ], |
1228 | | - "source": [ |
1229 | | - "print(begin_utc)\n", |
1230 | | - "print(end_utc)\n", |
1231 | | - "print(begin_Los_Angeles)\n", |
1232 | | - "print(end_Los_Angeles)" |
1233 | | - ] |
1234 | | - }, |
1235 | 1212 | { |
1236 | 1213 | "cell_type": "markdown", |
1237 | 1214 | "metadata": {}, |
1238 | 1215 | "source": [ |
1239 | | - "### 5.3 Read json with no LastModified filter " |
| 1216 | + "### 5.3 Read json using the LastModified filters " |
1240 | 1217 | ] |
1241 | 1218 | }, |
1242 | 1219 | { |
1243 | 1220 | "cell_type": "code", |
1244 | | - "execution_count": 22, |
1245 | | - "metadata": {}, |
1246 | | - "outputs": [ |
1247 | | - { |
1248 | | - "name": "stdout", |
1249 | | - "output_type": "stream", |
1250 | | - "text": [ |
1251 | | - "# read_fwf\n", |
1252 | | - " id name date\n", |
1253 | | - "0 1 Herfelingen 27-12-18\n", |
1254 | | - "1 2 Lambusart 14-06-18\n", |
1255 | | - "2 3 Spormaggiore 15-04-18\n", |
1256 | | - "3 4 Buizingen 05-09-19\n", |
1257 | | - "4 5 San Rafael 04-09-19\n", |
1258 | | - "\n", |
1259 | | - " read_json\n", |
1260 | | - " id name\n", |
1261 | | - "0 1 foo\n", |
1262 | | - "1 2 boo\n", |
1263 | | - "0 3 bar\n", |
1264 | | - "\n", |
1265 | | - " read_csv\n", |
1266 | | - " id name\n", |
1267 | | - "0 1 foo\n", |
1268 | | - "1 2 boo\n", |
1269 | | - "2 3 bar\n", |
1270 | | - "\n", |
1271 | | - " read_parquet\n" |
1272 | | - ] |
1273 | | - }, |
1274 | | - { |
1275 | | - "data": { |
1276 | | - "text/html": [ |
1277 | | - "<div>\n", |
1278 | | - "<style scoped>\n", |
1279 | | - " .dataframe tbody tr th:only-of-type {\n", |
1280 | | - " vertical-align: middle;\n", |
1281 | | - " }\n", |
1282 | | - "\n", |
1283 | | - " .dataframe tbody tr th {\n", |
1284 | | - " vertical-align: top;\n", |
1285 | | - " }\n", |
1286 | | - "\n", |
1287 | | - " .dataframe thead th {\n", |
1288 | | - " text-align: right;\n", |
1289 | | - " }\n", |
1290 | | - "</style>\n", |
1291 | | - "<table border=\"1\" class=\"dataframe\">\n", |
1292 | | - " <thead>\n", |
1293 | | - " <tr style=\"text-align: right;\">\n", |
1294 | | - " <th></th>\n", |
1295 | | - " <th>id</th>\n", |
1296 | | - " <th>name</th>\n", |
1297 | | - " </tr>\n", |
1298 | | - " </thead>\n", |
1299 | | - " <tbody>\n", |
1300 | | - " <tr>\n", |
1301 | | - " <th>0</th>\n", |
1302 | | - " <td>1</td>\n", |
1303 | | - " <td>foo</td>\n", |
1304 | | - " </tr>\n", |
1305 | | - " <tr>\n", |
1306 | | - " <th>1</th>\n", |
1307 | | - " <td>2</td>\n", |
1308 | | - " <td>boo</td>\n", |
1309 | | - " </tr>\n", |
1310 | | - " <tr>\n", |
1311 | | - " <th>2</th>\n", |
1312 | | - " <td>3</td>\n", |
1313 | | - " <td>bar</td>\n", |
1314 | | - " </tr>\n", |
1315 | | - " </tbody>\n", |
1316 | | - "</table>\n", |
1317 | | - "</div>" |
1318 | | - ], |
1319 | | - "text/plain": [ |
1320 | | - " id name\n", |
1321 | | - "0 1 foo\n", |
1322 | | - "1 2 boo\n", |
1323 | | - "2 3 bar" |
1324 | | - ] |
1325 | | - }, |
1326 | | - "execution_count": 22, |
1327 | | - "metadata": {}, |
1328 | | - "output_type": "execute_result" |
1329 | | - } |
1330 | | - ], |
1331 | | - "source": [ |
1332 | | - "print('# read_fwf')\n", |
1333 | | - "print(wr.s3.read_fwf(f\"s3://{bucket}/fwf/\", names=[\"id\", \"name\", \"date\"]))\n", |
1334 | | - "print('\\n read_json')\n", |
1335 | | - "print(wr.s3.read_json(f\"s3://{bucket}/json/\"))\n", |
1336 | | - "print('\\n read_csv')\n", |
1337 | | - "print(wr.s3.read_csv(f\"s3://{bucket}/csv/\"))\n", |
1338 | | - "print('\\n read_parquet')\n", |
1339 | | - "wr.s3.read_parquet(f\"s3://{bucket}/parquet/\")" |
1340 | | - ] |
1341 | | - }, |
1342 | | - { |
1343 | | - "cell_type": "markdown", |
1344 | | - "metadata": {}, |
1345 | | - "source": [ |
1346 | | - "### 5.4 Read json using the LastModified filter " |
1347 | | - ] |
1348 | | - }, |
1349 | | - { |
1350 | | - "cell_type": "code", |
1351 | | - "execution_count": 23, |
| 1221 | + "execution_count": 21, |
1352 | 1222 | "metadata": {}, |
1353 | | - "outputs": [ |
1354 | | - { |
1355 | | - "name": "stdout", |
1356 | | - "output_type": "stream", |
1357 | | - "text": [ |
1358 | | - "# read_fwf\n", |
1359 | | - " id name date\n", |
1360 | | - "0 1 Herfelingen 27-12-18\n", |
1361 | | - "1 2 Lambusart 14-06-18\n", |
1362 | | - "2 3 Spormaggiore 15-04-18\n", |
1363 | | - "3 4 Buizingen 05-09-19\n", |
1364 | | - "4 5 San Rafael 04-09-19\n", |
1365 | | - "\n", |
1366 | | - " read_json\n", |
1367 | | - " id name\n", |
1368 | | - "0 1 foo\n", |
1369 | | - "1 2 boo\n", |
1370 | | - "0 3 bar\n", |
1371 | | - "\n", |
1372 | | - " read_csv\n", |
1373 | | - " id name\n", |
1374 | | - "0 1 foo\n", |
1375 | | - "1 2 boo\n", |
1376 | | - "2 3 bar\n", |
1377 | | - "\n", |
1378 | | - " read_parquet\n", |
1379 | | - " id name\n", |
1380 | | - "0 1 foo\n", |
1381 | | - "1 2 boo\n", |
1382 | | - "2 3 bar\n" |
1383 | | - ] |
1384 | | - } |
1385 | | - ], |
| 1223 | + "outputs": [], |
1386 | 1224 | "source": [ |
1387 | | - "print('# read_fwf')\n", |
1388 | | - "print(wr.s3.read_fwf(f\"s3://{bucket}/fwf/\", names=[\"id\", \"name\", \"date\"], last_modified_begin=begin_utc, last_modified_end=end_utc))\n", |
1389 | | - "print('\\n read_json')\n", |
1390 | | - "print(wr.s3.read_json(f\"s3://{bucket}/json/\", last_modified_begin=begin_utc, last_modified_end=end_utc))\n", |
1391 | | - "print('\\n read_csv')\n", |
1392 | | - "print(wr.s3.read_csv(f\"s3://{bucket}/csv/\", last_modified_begin=begin_utc, last_modified_end=end_utc))\n", |
1393 | | - "print('\\n read_parquet')\n", |
1394 | | - "print(wr.s3.read_parquet(f\"s3://{bucket}/parquet/\", last_modified_begin=begin_utc, last_modified_end=end_utc))" |
| 1225 | + "wr.s3.read_fwf(f\"s3://{bucket}/fwf/\", names=[\"id\", \"name\", \"date\"], last_modified_begin=begin_utc, last_modified_end=end_utc)\n", |
| 1226 | + "wr.s3.read_json(f\"s3://{bucket}/json/\", last_modified_begin=begin_utc, last_modified_end=end_utc)\n", |
| 1227 | + "wr.s3.read_csv(f\"s3://{bucket}/csv/\", last_modified_begin=begin_utc, last_modified_end=end_utc)\n", |
| 1228 | + "wr.s3.read_parquet(f\"s3://{bucket}/parquet/\", last_modified_begin=begin_utc, last_modified_end=end_utc);" |
1395 | 1229 | ] |
1396 | 1230 | }, |
1397 | 1231 | { |
|
1403 | 1237 | }, |
1404 | 1238 | { |
1405 | 1239 | "cell_type": "code", |
1406 | | - "execution_count": 24, |
| 1240 | + "execution_count": 22, |
1407 | 1241 | "metadata": {}, |
1408 | 1242 | "outputs": [], |
1409 | 1243 | "source": [ |
|
0 commit comments