noshot 0.1.8__py3-none-any.whl → 0.1.9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,784 @@
1
+ {
2
+ "cells": [
3
+ {
4
+ "cell_type": "markdown",
5
+ "id": "6b192e2a-14e9-4707-b1c1-e8f5aa32a919",
6
+ "metadata": {},
7
+ "source": [
8
+ "### __Import Required Libraries__"
9
+ ]
10
+ },
11
+ {
12
+ "cell_type": "code",
13
+ "execution_count": 4,
14
+ "id": "95be04fa-500c-4308-9784-b07bb42d5232",
15
+ "metadata": {},
16
+ "outputs": [],
17
+ "source": [
18
+ "import pandas as pd\n",
19
+ "import matplotlib.pyplot as plt"
20
+ ]
21
+ },
22
+ {
23
+ "cell_type": "markdown",
24
+ "id": "e5ff8a35-769d-4eda-b5f3-d3c9ba7a2dce",
25
+ "metadata": {},
26
+ "source": [
27
+ "##### __1. Importing the dataset__"
28
+ ]
29
+ },
30
+ {
31
+ "cell_type": "code",
32
+ "execution_count": 5,
33
+ "id": "69caa184-219d-4b01-8a30-1ea9ba61dcff",
34
+ "metadata": {},
35
+ "outputs": [
36
+ {
37
+ "name": "stdout",
38
+ "output_type": "stream",
39
+ "text": [
40
+ "(29580, 4)\n"
41
+ ]
42
+ }
43
+ ],
44
+ "source": [
45
+ "df = pd.read_csv('raw_sales.csv', index_col = 'datesold', parse_dates = ['datesold'])  # datetime index from the first cell on\n",
46
+ "print(df.shape)"
47
+ ]
48
+ },
49
+ {
50
+ "cell_type": "markdown",
51
+ "id": "f8273eed-a0e9-4d52-a183-350a7393a290",
52
+ "metadata": {},
53
+ "source": [
54
+ "##### __2. Display the first few rows and the last few rows to peek at the data__"
55
+ ]
56
+ },
57
+ {
58
+ "cell_type": "code",
59
+ "execution_count": 3,
60
+ "id": "490892d7-df7d-4c0f-9f8a-63883ce7432f",
61
+ "metadata": {},
62
+ "outputs": [
63
+ {
64
+ "data": {
65
+ "text/html": [
66
+ "<div>\n",
67
+ "<style scoped>\n",
68
+ " .dataframe tbody tr th:only-of-type {\n",
69
+ " vertical-align: middle;\n",
70
+ " }\n",
71
+ "\n",
72
+ " .dataframe tbody tr th {\n",
73
+ " vertical-align: top;\n",
74
+ " }\n",
75
+ "\n",
76
+ " .dataframe thead th {\n",
77
+ " text-align: right;\n",
78
+ " }\n",
79
+ "</style>\n",
80
+ "<table border=\"1\" class=\"dataframe\">\n",
81
+ " <thead>\n",
82
+ " <tr style=\"text-align: right;\">\n",
83
+ " <th></th>\n",
84
+ " <th>postcode</th>\n",
85
+ " <th>price</th>\n",
86
+ " <th>propertyType</th>\n",
87
+ " <th>bedrooms</th>\n",
88
+ " </tr>\n",
89
+ " <tr>\n",
90
+ " <th>datesold</th>\n",
91
+ " <th></th>\n",
92
+ " <th></th>\n",
93
+ " <th></th>\n",
94
+ " <th></th>\n",
95
+ " </tr>\n",
96
+ " </thead>\n",
97
+ " <tbody>\n",
98
+ " <tr>\n",
99
+ " <th>2007-02-07 00:00:00</th>\n",
100
+ " <td>2607</td>\n",
101
+ " <td>525000</td>\n",
102
+ " <td>house</td>\n",
103
+ " <td>4</td>\n",
104
+ " </tr>\n",
105
+ " <tr>\n",
106
+ " <th>2007-02-27 00:00:00</th>\n",
107
+ " <td>2906</td>\n",
108
+ " <td>290000</td>\n",
109
+ " <td>house</td>\n",
110
+ " <td>3</td>\n",
111
+ " </tr>\n",
112
+ " <tr>\n",
113
+ " <th>2007-03-07 00:00:00</th>\n",
114
+ " <td>2905</td>\n",
115
+ " <td>328000</td>\n",
116
+ " <td>house</td>\n",
117
+ " <td>3</td>\n",
118
+ " </tr>\n",
119
+ " <tr>\n",
120
+ " <th>2007-03-09 00:00:00</th>\n",
121
+ " <td>2905</td>\n",
122
+ " <td>380000</td>\n",
123
+ " <td>house</td>\n",
124
+ " <td>4</td>\n",
125
+ " </tr>\n",
126
+ " <tr>\n",
127
+ " <th>2007-03-21 00:00:00</th>\n",
128
+ " <td>2906</td>\n",
129
+ " <td>310000</td>\n",
130
+ " <td>house</td>\n",
131
+ " <td>3</td>\n",
132
+ " </tr>\n",
133
+ " </tbody>\n",
134
+ "</table>\n",
135
+ "</div>"
136
+ ],
137
+ "text/plain": [
138
+ " postcode price propertyType bedrooms\n",
139
+ "datesold \n",
140
+ "2007-02-07 00:00:00 2607 525000 house 4\n",
141
+ "2007-02-27 00:00:00 2906 290000 house 3\n",
142
+ "2007-03-07 00:00:00 2905 328000 house 3\n",
143
+ "2007-03-09 00:00:00 2905 380000 house 4\n",
144
+ "2007-03-21 00:00:00 2906 310000 house 3"
145
+ ]
146
+ },
147
+ "execution_count": 3,
148
+ "metadata": {},
149
+ "output_type": "execute_result"
150
+ }
151
+ ],
152
+ "source": [
153
+ "display(df.head(), df.tail())"
154
+ ]
155
+ },
156
+ {
157
+ "cell_type": "markdown",
158
+ "id": "9c24bbd0-75f0-4eb6-863d-7960337bcb77",
159
+ "metadata": {},
160
+ "source": [
161
+ "##### __3. Print the summary statistics__"
162
+ ]
163
+ },
164
+ {
165
+ "cell_type": "code",
166
+ "execution_count": 4,
167
+ "id": "bf0037dd-41b5-4c55-ae5c-8dfa5cb11f90",
168
+ "metadata": {},
169
+ "outputs": [
170
+ {
171
+ "data": {
172
+ "text/html": [
173
+ "<div>\n",
174
+ "<style scoped>\n",
175
+ " .dataframe tbody tr th:only-of-type {\n",
176
+ " vertical-align: middle;\n",
177
+ " }\n",
178
+ "\n",
179
+ " .dataframe tbody tr th {\n",
180
+ " vertical-align: top;\n",
181
+ " }\n",
182
+ "\n",
183
+ " .dataframe thead th {\n",
184
+ " text-align: right;\n",
185
+ " }\n",
186
+ "</style>\n",
187
+ "<table border=\"1\" class=\"dataframe\">\n",
188
+ " <thead>\n",
189
+ " <tr style=\"text-align: right;\">\n",
190
+ " <th></th>\n",
191
+ " <th>count</th>\n",
192
+ " <th>mean</th>\n",
193
+ " <th>std</th>\n",
194
+ " <th>min</th>\n",
195
+ " <th>25%</th>\n",
196
+ " <th>50%</th>\n",
197
+ " <th>75%</th>\n",
198
+ " <th>max</th>\n",
199
+ " </tr>\n",
200
+ " </thead>\n",
201
+ " <tbody>\n",
202
+ " <tr>\n",
203
+ " <th>postcode</th>\n",
204
+ " <td>29580.0</td>\n",
205
+ " <td>2730.249730</td>\n",
206
+ " <td>146.717292</td>\n",
207
+ " <td>2600.0</td>\n",
208
+ " <td>2607.0</td>\n",
209
+ " <td>2615.0</td>\n",
210
+ " <td>2905.0</td>\n",
211
+ " <td>2914.0</td>\n",
212
+ " </tr>\n",
213
+ " <tr>\n",
214
+ " <th>price</th>\n",
215
+ " <td>29580.0</td>\n",
216
+ " <td>609736.262204</td>\n",
217
+ " <td>281707.905374</td>\n",
218
+ " <td>56500.0</td>\n",
219
+ " <td>440000.0</td>\n",
220
+ " <td>550000.0</td>\n",
221
+ " <td>705000.0</td>\n",
222
+ " <td>8000000.0</td>\n",
223
+ " </tr>\n",
224
+ " <tr>\n",
225
+ " <th>bedrooms</th>\n",
226
+ " <td>29580.0</td>\n",
227
+ " <td>3.250169</td>\n",
228
+ " <td>0.951275</td>\n",
229
+ " <td>0.0</td>\n",
230
+ " <td>3.0</td>\n",
231
+ " <td>3.0</td>\n",
232
+ " <td>4.0</td>\n",
233
+ " <td>5.0</td>\n",
234
+ " </tr>\n",
235
+ " </tbody>\n",
236
+ "</table>\n",
237
+ "</div>"
238
+ ],
239
+ "text/plain": [
240
+ " count mean std min 25% 50% \\\n",
241
+ "postcode 29580.0 2730.249730 146.717292 2600.0 2607.0 2615.0 \n",
242
+ "price 29580.0 609736.262204 281707.905374 56500.0 440000.0 550000.0 \n",
243
+ "bedrooms 29580.0 3.250169 0.951275 0.0 3.0 3.0 \n",
244
+ "\n",
245
+ " 75% max \n",
246
+ "postcode 2905.0 2914.0 \n",
247
+ "price 705000.0 8000000.0 \n",
248
+ "bedrooms 4.0 5.0 "
249
+ ]
250
+ },
251
+ "execution_count": 4,
252
+ "metadata": {},
253
+ "output_type": "execute_result"
254
+ }
255
+ ],
256
+ "source": [
257
+ "df.describe().transpose()"
258
+ ]
259
+ },
260
+ {
261
+ "cell_type": "markdown",
262
+ "id": "fb7299b8-90fe-4dae-93a1-496129bc928a",
263
+ "metadata": {},
264
+ "source": [
265
+ "##### __4. Filter data for a specific year__"
266
+ ]
267
+ },
268
+ {
269
+ "cell_type": "code",
270
+ "execution_count": 6,
271
+ "id": "6a533c7b-6786-4789-9a18-0f19125de32d",
272
+ "metadata": {},
273
+ "outputs": [
274
+ {
275
+ "data": {
276
+ "text/plain": [
277
+ "522377.2108843537"
278
+ ]
279
+ },
280
+ "execution_count": 6,
281
+ "metadata": {},
282
+ "output_type": "execute_result"
283
+ }
284
+ ],
285
+ "source": [
286
+ "df.index = pd.to_datetime(df.index)  # ensure a DatetimeIndex so .year is available\n",
287
+ "df.loc[df.index.year == 2007, 'price'].mean()"
288
+ ]
289
+ },
290
+ {
291
+ "cell_type": "markdown",
292
+ "id": "111029b6-fcc9-4f5e-a9d8-833ae27c039e",
293
+ "metadata": {},
294
+ "source": [
295
+ "##### __5. Plot the average price per year__"
296
+ ]
297
+ },
298
+ {
299
+ "cell_type": "code",
300
+ "execution_count": 6,
301
+ "id": "71212203-c3e5-49ca-aa07-bbc12a2e0de6",
302
+ "metadata": {},
303
+ "outputs": [
304
+ {
305
+ "data": {
306
+ "text/plain": [
307
+ "datesold\n",
308
+ "2007 522377.210884\n",
309
+ "2008 493814.162754\n",
310
+ "2009 496092.032959\n",
311
+ "2010 559564.810289\n",
312
+ "2011 566715.110227\n",
313
+ "2012 552501.369214\n",
314
+ "2013 553416.296838\n",
315
+ "2014 592653.761439\n",
316
+ "2015 626101.342654\n",
317
+ "2016 635185.311668\n",
318
+ "2017 671880.551420\n",
319
+ "2018 660701.042768\n",
320
+ "2019 634184.218773\n",
321
+ "Name: price, dtype: float64"
322
+ ]
323
+ },
324
+ "execution_count": 6,
325
+ "metadata": {},
326
+ "output_type": "execute_result"
327
+ }
328
+ ],
329
+ "source": [
330
+ "df['price'].groupby(df.index.year).mean().plot(marker = 'o', title = 'Average Price per Year');"
331
+ ]
332
+ },
333
+ {
334
+ "cell_type": "markdown",
335
+ "id": "0405f26e-b564-48a2-9fb5-6d89311a363e",
336
+ "metadata": {},
337
+ "source": [
338
+ "##### __6. Count of properties sold per year__"
339
+ ]
340
+ },
341
+ {
342
+ "cell_type": "code",
343
+ "execution_count": 7,
344
+ "id": "7e1cb0fb-f494-49b1-adbc-89824b7e3855",
345
+ "metadata": {},
346
+ "outputs": [
347
+ {
348
+ "data": {
349
+ "image/png": "",
350
+ "text/plain": [
351
+ "<Figure size 640x480 with 1 Axes>"
352
+ ]
353
+ },
354
+ "metadata": {},
355
+ "output_type": "display_data"
356
+ }
357
+ ],
358
+ "source": [
359
+ "# size() counts rows per group directly, so no per-column loop is needed\n",
360
+ "sales_per_year = df.groupby(df.index.year).size()\n",
361
+ "plt.bar(sales_per_year.index, sales_per_year.values, label = 'Property_Sold/Yr')\n",
362
+ "plt.xlabel('Year')\n",
363
+ "plt.ylabel('Properties sold')\n",
364
+ "plt.title('Property\\'s Sold Year Wise')\n",
365
+ "plt.legend()\n",
366
+ "plt.show()"
367
+ ]
368
+ },
369
+ {
370
+ "cell_type": "markdown",
371
+ "id": "d9b4c518-05ec-41ba-956d-e145efc958fd",
372
+ "metadata": {},
373
+ "source": [
374
+ "##### __7. Query for a specific date range (e.g., Jan 2010 to Dec 2015)__"
375
+ ]
376
+ },
377
+ {
378
+ "cell_type": "code",
379
+ "execution_count": 8,
380
+ "id": "17f1f390-9e5b-4bc1-882a-88d0331e3a12",
381
+ "metadata": {},
382
+ "outputs": [
383
+ {
384
+ "data": {
385
+ "text/html": [
386
+ "<div>\n",
387
+ "<style scoped>\n",
388
+ " .dataframe tbody tr th:only-of-type {\n",
389
+ " vertical-align: middle;\n",
390
+ " }\n",
391
+ "\n",
392
+ " .dataframe tbody tr th {\n",
393
+ " vertical-align: top;\n",
394
+ " }\n",
395
+ "\n",
396
+ " .dataframe thead th {\n",
397
+ " text-align: right;\n",
398
+ " }\n",
399
+ "</style>\n",
400
+ "<table border=\"1\" class=\"dataframe\">\n",
401
+ " <thead>\n",
402
+ " <tr style=\"text-align: right;\">\n",
403
+ " <th></th>\n",
404
+ " <th>postcode</th>\n",
405
+ " <th>price</th>\n",
406
+ " <th>propertyType</th>\n",
407
+ " <th>bedrooms</th>\n",
408
+ " </tr>\n",
409
+ " <tr>\n",
410
+ " <th>datesold</th>\n",
411
+ " <th></th>\n",
412
+ " <th></th>\n",
413
+ " <th></th>\n",
414
+ " <th></th>\n",
415
+ " </tr>\n",
416
+ " </thead>\n",
417
+ " <tbody>\n",
418
+ " <tr>\n",
419
+ " <th>2010-01-04</th>\n",
420
+ " <td>2615</td>\n",
421
+ " <td>435000</td>\n",
422
+ " <td>house</td>\n",
423
+ " <td>3</td>\n",
424
+ " </tr>\n",
425
+ " <tr>\n",
426
+ " <th>2010-01-05</th>\n",
427
+ " <td>2904</td>\n",
428
+ " <td>712000</td>\n",
429
+ " <td>house</td>\n",
430
+ " <td>4</td>\n",
431
+ " </tr>\n",
432
+ " <tr>\n",
433
+ " <th>2010-01-06</th>\n",
434
+ " <td>2617</td>\n",
435
+ " <td>435000</td>\n",
436
+ " <td>house</td>\n",
437
+ " <td>4</td>\n",
438
+ " </tr>\n",
439
+ " <tr>\n",
440
+ " <th>2010-01-06</th>\n",
441
+ " <td>2606</td>\n",
442
+ " <td>1350000</td>\n",
443
+ " <td>house</td>\n",
444
+ " <td>5</td>\n",
445
+ " </tr>\n",
446
+ " <tr>\n",
447
+ " <th>2010-01-07</th>\n",
448
+ " <td>2905</td>\n",
449
+ " <td>612500</td>\n",
450
+ " <td>house</td>\n",
451
+ " <td>4</td>\n",
452
+ " </tr>\n",
453
+ " <tr>\n",
454
+ " <th>...</th>\n",
455
+ " <td>...</td>\n",
456
+ " <td>...</td>\n",
457
+ " <td>...</td>\n",
458
+ " <td>...</td>\n",
459
+ " </tr>\n",
460
+ " <tr>\n",
461
+ " <th>2015-12-23</th>\n",
462
+ " <td>2603</td>\n",
463
+ " <td>415000</td>\n",
464
+ " <td>unit</td>\n",
465
+ " <td>2</td>\n",
466
+ " </tr>\n",
467
+ " <tr>\n",
468
+ " <th>2015-12-23</th>\n",
469
+ " <td>2612</td>\n",
470
+ " <td>438000</td>\n",
471
+ " <td>unit</td>\n",
472
+ " <td>2</td>\n",
473
+ " </tr>\n",
474
+ " <tr>\n",
475
+ " <th>2015-12-23</th>\n",
476
+ " <td>2612</td>\n",
477
+ " <td>450000</td>\n",
478
+ " <td>unit</td>\n",
479
+ " <td>2</td>\n",
480
+ " </tr>\n",
481
+ " <tr>\n",
482
+ " <th>2015-12-23</th>\n",
483
+ " <td>2605</td>\n",
484
+ " <td>515000</td>\n",
485
+ " <td>unit</td>\n",
486
+ " <td>2</td>\n",
487
+ " </tr>\n",
488
+ " <tr>\n",
489
+ " <th>2015-12-24</th>\n",
490
+ " <td>2900</td>\n",
491
+ " <td>365000</td>\n",
492
+ " <td>unit</td>\n",
493
+ " <td>2</td>\n",
494
+ " </tr>\n",
495
+ " </tbody>\n",
496
+ "</table>\n",
497
+ "<p>13676 rows × 4 columns</p>\n",
498
+ "</div>"
499
+ ],
500
+ "text/plain": [
501
+ " postcode price propertyType bedrooms\n",
502
+ "datesold \n",
503
+ "2010-01-04 2615 435000 house 3\n",
504
+ "2010-01-05 2904 712000 house 4\n",
505
+ "2010-01-06 2617 435000 house 4\n",
506
+ "2010-01-06 2606 1350000 house 5\n",
507
+ "2010-01-07 2905 612500 house 4\n",
508
+ "... ... ... ... ...\n",
509
+ "2015-12-23 2603 415000 unit 2\n",
510
+ "2015-12-23 2612 438000 unit 2\n",
511
+ "2015-12-23 2612 450000 unit 2\n",
512
+ "2015-12-23 2605 515000 unit 2\n",
513
+ "2015-12-24 2900 365000 unit 2\n",
514
+ "\n",
515
+ "[13676 rows x 4 columns]"
516
+ ]
517
+ },
518
+ "execution_count": 8,
519
+ "metadata": {},
520
+ "output_type": "execute_result"
521
+ }
522
+ ],
523
+ "source": [
524
+ "# Inclusive on both ends: 1 Jan 2010 through 31 Dec 2015 (ISO dates avoid day/month ambiguity)\n",
525
+ "df2 = df[(df.index >= '2010-01-01') & (df.index <= '2015-12-31')]\n",
526
+ "df2"
527
+ ]
528
+ },
529
+ {
530
+ "cell_type": "markdown",
531
+ "id": "28c84984-a5f0-4c46-963f-5c6e3336aed9",
532
+ "metadata": {},
533
+ "source": [
534
+ "##### __8. Calculate the mean price month-wise (use Groupby)__"
535
+ ]
536
+ },
537
+ {
538
+ "cell_type": "code",
539
+ "execution_count": 9,
540
+ "id": "db344276-03ab-4fb5-bb62-5dbc0fc11852",
541
+ "metadata": {
542
+ "scrolled": true
543
+ },
544
+ "outputs": [
545
+ {
546
+ "data": {
547
+ "text/plain": [
548
+ "datesold\n",
549
+ "1 544888.799283\n",
550
+ "2 563432.444644\n",
551
+ "3 591471.616919\n",
552
+ "4 576216.768116\n",
553
+ "5 582079.192840\n",
554
+ "6 567459.933735\n",
555
+ "7 561843.308653\n",
556
+ "8 565462.996815\n",
557
+ "9 586977.304541\n",
558
+ "10 597253.885895\n",
559
+ "11 624797.507752\n",
560
+ "12 597433.875000\n",
561
+ "Name: price, dtype: float64"
562
+ ]
563
+ },
564
+ "execution_count": 9,
565
+ "metadata": {},
566
+ "output_type": "execute_result"
567
+ }
568
+ ],
569
+ "source": [
570
+ "df2.groupby(df2.index.month)['price'].mean()"
571
+ ]
572
+ },
573
+ {
574
+ "cell_type": "markdown",
575
+ "id": "3f1afa45-d234-4f01-bf63-ea2a5a73f708",
576
+ "metadata": {},
577
+ "source": [
578
+ "##### __9. Perform a histogram plot__"
579
+ ]
580
+ },
581
+ {
582
+ "cell_type": "code",
583
+ "execution_count": 10,
584
+ "id": "f0d19cd6-8800-4b7b-b827-6c8fb43d72d9",
585
+ "metadata": {},
586
+ "outputs": [
587
+ {
588
+ "data": {
589
+ "image/png": "",
590
+ "text/plain": [
591
+ "<Figure size 640x480 with 1 Axes>"
592
+ ]
593
+ },
594
+ "metadata": {},
595
+ "output_type": "display_data"
596
+ }
597
+ ],
598
+ "source": [
599
+ "plt.hist(df['price'], bins = 50)\n",
600
+ "plt.title('Price Distribution')\n",
601
+ "plt.show()"
602
+ ]
603
+ },
604
+ {
605
+ "cell_type": "markdown",
606
+ "id": "b33230fa-a886-4639-926a-cb60f0398745",
607
+ "metadata": {},
608
+ "source": [
609
+ "##### __10. Print the properties priced above 5 lakhs (500,000)__"
610
+ ]
611
+ },
612
+ {
613
+ "cell_type": "code",
614
+ "execution_count": 11,
615
+ "id": "42695276-9e68-4e56-90a6-02a10e78ed14",
616
+ "metadata": {},
617
+ "outputs": [
618
+ {
619
+ "data": {
620
+ "text/html": [
621
+ "<div>\n",
622
+ "<style scoped>\n",
623
+ " .dataframe tbody tr th:only-of-type {\n",
624
+ " vertical-align: middle;\n",
625
+ " }\n",
626
+ "\n",
627
+ " .dataframe tbody tr th {\n",
628
+ " vertical-align: top;\n",
629
+ " }\n",
630
+ "\n",
631
+ " .dataframe thead th {\n",
632
+ " text-align: right;\n",
633
+ " }\n",
634
+ "</style>\n",
635
+ "<table border=\"1\" class=\"dataframe\">\n",
636
+ " <thead>\n",
637
+ " <tr style=\"text-align: right;\">\n",
638
+ " <th></th>\n",
639
+ " <th>postcode</th>\n",
640
+ " <th>price</th>\n",
641
+ " <th>propertyType</th>\n",
642
+ " <th>bedrooms</th>\n",
643
+ " </tr>\n",
644
+ " <tr>\n",
645
+ " <th>datesold</th>\n",
646
+ " <th></th>\n",
647
+ " <th></th>\n",
648
+ " <th></th>\n",
649
+ " <th></th>\n",
650
+ " </tr>\n",
651
+ " </thead>\n",
652
+ " <tbody>\n",
653
+ " <tr>\n",
654
+ " <th>2007-02-07</th>\n",
655
+ " <td>2607</td>\n",
656
+ " <td>525000</td>\n",
657
+ " <td>house</td>\n",
658
+ " <td>4</td>\n",
659
+ " </tr>\n",
660
+ " <tr>\n",
661
+ " <th>2007-04-30</th>\n",
662
+ " <td>2606</td>\n",
663
+ " <td>1530000</td>\n",
664
+ " <td>house</td>\n",
665
+ " <td>4</td>\n",
666
+ " </tr>\n",
667
+ " <tr>\n",
668
+ " <th>2007-06-27</th>\n",
669
+ " <td>2612</td>\n",
670
+ " <td>850000</td>\n",
671
+ " <td>house</td>\n",
672
+ " <td>4</td>\n",
673
+ " </tr>\n",
674
+ " <tr>\n",
675
+ " <th>2007-06-28</th>\n",
676
+ " <td>2904</td>\n",
677
+ " <td>765000</td>\n",
678
+ " <td>house</td>\n",
679
+ " <td>4</td>\n",
680
+ " </tr>\n",
681
+ " <tr>\n",
682
+ " <th>2007-06-30</th>\n",
683
+ " <td>2615</td>\n",
684
+ " <td>517000</td>\n",
685
+ " <td>house</td>\n",
686
+ " <td>4</td>\n",
687
+ " </tr>\n",
688
+ " <tr>\n",
689
+ " <th>...</th>\n",
690
+ " <td>...</td>\n",
691
+ " <td>...</td>\n",
692
+ " <td>...</td>\n",
693
+ " <td>...</td>\n",
694
+ " </tr>\n",
695
+ " <tr>\n",
696
+ " <th>2019-07-23</th>\n",
697
+ " <td>2912</td>\n",
698
+ " <td>549950</td>\n",
699
+ " <td>unit</td>\n",
700
+ " <td>3</td>\n",
701
+ " </tr>\n",
702
+ " <tr>\n",
703
+ " <th>2019-07-24</th>\n",
704
+ " <td>2601</td>\n",
705
+ " <td>590000</td>\n",
706
+ " <td>unit</td>\n",
707
+ " <td>1</td>\n",
708
+ " </tr>\n",
709
+ " <tr>\n",
710
+ " <th>2019-07-25</th>\n",
711
+ " <td>2612</td>\n",
712
+ " <td>560000</td>\n",
713
+ " <td>unit</td>\n",
714
+ " <td>2</td>\n",
715
+ " </tr>\n",
716
+ " <tr>\n",
717
+ " <th>2019-07-26</th>\n",
718
+ " <td>2601</td>\n",
719
+ " <td>589000</td>\n",
720
+ " <td>unit</td>\n",
721
+ " <td>2</td>\n",
722
+ " </tr>\n",
723
+ " <tr>\n",
724
+ " <th>2019-07-26</th>\n",
725
+ " <td>2612</td>\n",
726
+ " <td>775000</td>\n",
727
+ " <td>unit</td>\n",
728
+ " <td>2</td>\n",
729
+ " </tr>\n",
730
+ " </tbody>\n",
731
+ "</table>\n",
732
+ "<p>17873 rows × 4 columns</p>\n",
733
+ "</div>"
734
+ ],
735
+ "text/plain": [
736
+ " postcode price propertyType bedrooms\n",
737
+ "datesold \n",
738
+ "2007-02-07 2607 525000 house 4\n",
739
+ "2007-04-30 2606 1530000 house 4\n",
740
+ "2007-06-27 2612 850000 house 4\n",
741
+ "2007-06-28 2904 765000 house 4\n",
742
+ "2007-06-30 2615 517000 house 4\n",
743
+ "... ... ... ... ...\n",
744
+ "2019-07-23 2912 549950 unit 3\n",
745
+ "2019-07-24 2601 590000 unit 1\n",
746
+ "2019-07-25 2612 560000 unit 2\n",
747
+ "2019-07-26 2601 589000 unit 2\n",
748
+ "2019-07-26 2612 775000 unit 2\n",
749
+ "\n",
750
+ "[17873 rows x 4 columns]"
751
+ ]
752
+ },
753
+ "execution_count": 11,
754
+ "metadata": {},
755
+ "output_type": "execute_result"
756
+ }
757
+ ],
758
+ "source": [
759
+ "df.query('price > 500000')"
760
+ ]
761
+ }
762
+ ],
763
+ "metadata": {
764
+ "kernelspec": {
765
+ "display_name": "Python 3 (ipykernel)",
766
+ "language": "python",
767
+ "name": "python3"
768
+ },
769
+ "language_info": {
770
+ "codemirror_mode": {
771
+ "name": "ipython",
772
+ "version": 3
773
+ },
774
+ "file_extension": ".py",
775
+ "mimetype": "text/x-python",
776
+ "name": "python",
777
+ "nbconvert_exporter": "python",
778
+ "pygments_lexer": "ipython3",
779
+ "version": "3.11.7"
780
+ }
781
+ },
782
+ "nbformat": 4,
783
+ "nbformat_minor": 5
784
+ }