#po potrebi instaliraj paket
#!pip install pandas-profiling
import pandas as pd
import pandas_profiling as pp
Naložim podatke:
# Load the listings CSV into a DataFrame.
# NOTE(review): the path is an absolute, machine-specific Windows location —
# adjust it when running this notebook elsewhere.
df = pd.read_csv(r"D:\OneDrive\GitHub\slanad_blog\static\data\2019-05-04_listings.csv")
# Summary statistics for the numeric columns (count, mean, std, min, quartiles, max).
df.describe()
| | id | host_id | neighbourhood_group | latitude | longitude | price | minimum_nights | number_of_reviews | reviews_per_month | calculated_host_listings_count | availability_365 |
---|---|---|---|---|---|---|---|---|---|---|---|
count | 1.127600e+04 | 1.127600e+04 | 0.0 | 11276.000000 | 11276.000000 | 11276.000000 | 11276.000000 | 11276.000000 | 9394.000000 | 11276.000000 | 11276.000000 |
mean | 1.791508e+07 | 6.831232e+07 | NaN | 48.206394 | 16.360991 | 77.850656 | 4.237052 | 28.989447 | 1.757868 | 5.768358 | 142.674885 |
std | 9.416062e+06 | 6.912654e+07 | NaN | 0.019361 | 0.034110 | 134.397362 | 17.971762 | 51.325959 | 1.917504 | 12.645909 | 135.123864 |
min | 2.309000e+03 | 2.522000e+03 | NaN | 48.125848 | 16.190898 | 9.000000 | 1.000000 | 0.000000 | 0.010000 | 1.000000 | 0.000000 |
25% | 1.010131e+07 | 1.073092e+07 | NaN | 48.192638 | 16.340987 | 38.000000 | 1.000000 | 2.000000 | 0.350000 | 1.000000 | 0.000000 |
50% | 1.929118e+07 | 3.845697e+07 | NaN | 48.206156 | 16.358773 | 56.000000 | 2.000000 | 9.000000 | 1.000000 | 1.000000 | 99.000000 |
75% | 2.596927e+07 | 1.132267e+08 | NaN | 48.219206 | 16.379510 | 85.000000 | 3.000000 | 32.000000 | 2.590000 | 4.000000 | 281.000000 |
max | 3.224153e+07 | 2.419409e+08 | NaN | 48.298573 | 16.546787 | 9270.000000 | 1000.000000 | 514.000000 | 14.230000 | 85.000000 | 365.000000 |
# Build the pandas-profiling report for df (dataset overview, warnings and
# per-variable statistics).
# NOTE(review): newer releases of this package are published as
# ydata-profiling — confirm which one is installed before re-running.
pp.ProfileReport(df)
Dataset info
Number of variables | 16 |
---|---|
Number of observations | 11276 |
Total Missing (%) | 8.3% |
Total size in memory | 1.4 MiB |
Average record size in memory | 128.0 B |
Variables types
Numeric | 10 |
---|---|
Categorical | 5 |
Boolean | 0 |
Date | 0 |
Text (Unique) | 0 |
Rejected | 1 |
Unsupported | 0 |
Warnings
availability_365 has 2977 / 26.4% zeros (Zeros)
host_name has a high cardinality: 2978 distinct values (Warning)
last_review has 1882 / 16.7% missing values (Missing)
last_review has a high cardinality: 1017 distinct values (Warning)
minimum_nights is highly skewed (γ1 = 34.34) (Skewed)
name has a high cardinality: 11051 distinct values (Warning)
neighbourhood_group has 11276 / 100.0% missing values (Missing)
neighbourhood_group has constant value (Rejected)
number_of_reviews has 1882 / 16.7% zeros (Zeros)
price is highly skewed (γ1 = 36.36) (Skewed)
reviews_per_month has 1882 / 16.7% missing values (Missing)
availability_365
Numeric
Distinct count | 366 |
---|---|
Unique (%) | 3.2% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 142.67 |
---|---|
Minimum | 0 |
Maximum | 365 |
Zeros (%) | 26.4% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 99 |
Q3 | 281 |
95-th percentile | 362 |
Maximum | 365 |
Range | 365 |
Interquartile range | 281 |
Descriptive statistics
Standard deviation | 135.12 |
---|---|
Coef of variation | 0.94708 |
Kurtosis | -1.4436 |
Mean | 142.67 |
MAD | 122.54 |
Skewness | 0.36892 |
Sum | 1608802 |
Variance | 18258 |
Memory size | 88.2 KiB |
Value | Count | Frequency (%) | |
0 | 2977 | 26.4% |
|
365 | 291 | 2.6% |
|
364 | 162 | 1.4% |
|
90 | 104 | 0.9% |
|
363 | 85 | 0.8% |
|
362 | 85 | 0.8% |
|
39 | 81 | 0.7% |
|
89 | 79 | 0.7% |
|
180 | 74 | 0.7% |
|
345 | 70 | 0.6% |
|
Other values (356) | 7268 | 64.5% |
|
Minimum 5 values
Value | Count | Frequency (%) | |
0 | 2977 | 26.4% |
|
1 | 63 | 0.6% |
|
2 | 50 | 0.4% |
|
3 | 36 | 0.3% |
|
4 | 43 | 0.4% |
|
Maximum 5 values
Value | Count | Frequency (%) | |
361 | 32 | 0.3% |
|
362 | 85 | 0.8% |
|
363 | 85 | 0.8% |
|
364 | 162 | 1.4% |
|
365 | 291 | 2.6% |
|
calculated_host_listings_count
Numeric
Distinct count | 37 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 5.7684 |
---|---|
Minimum | 1 |
Maximum | 85 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 1 |
Q3 | 4 |
95-th percentile | 29 |
Maximum | 85 |
Range | 84 |
Interquartile range | 3 |
Descriptive statistics
Standard deviation | 12.646 |
---|---|
Coef of variation | 2.1923 |
Kurtosis | 19.289 |
Mean | 5.7684 |
MAD | 6.7004 |
Skewness | 4.1898 |
Sum | 65044 |
Variance | 159.92 |
Memory size | 88.2 KiB |
Value | Count | Frequency (%) | |
1 | 6119 | 54.3% |
|
2 | 1470 | 13.0% |
|
3 | 774 | 6.9% |
|
4 | 384 | 3.4% |
|
5 | 310 | 2.7% |
|
7 | 231 | 2.0% |
|
6 | 210 | 1.9% |
|
8 | 192 | 1.7% |
|
9 | 126 | 1.1% |
|
12 | 108 | 1.0% |
|
Other values (27) | 1352 | 12.0% |
|
Minimum 5 values
Value | Count | Frequency (%) | |
1 | 6119 | 54.3% |
|
2 | 1470 | 13.0% |
|
3 | 774 | 6.9% |
|
4 | 384 | 3.4% |
|
5 | 310 | 2.7% |
|
Maximum 5 values
Value | Count | Frequency (%) | |
51 | 51 | 0.5% |
|
53 | 53 | 0.5% |
|
56 | 56 | 0.5% |
|
77 | 77 | 0.7% |
|
85 | 85 | 0.8% |
|
host_id
Numeric
Distinct count | 7448 |
---|---|
Unique (%) | 66.1% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 68312000 |
---|---|
Minimum | 2522 |
Maximum | 241940896 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 2522 |
---|---|
5-th percentile | 1547100 |
Q1 | 10731000 |
Median | 38457000 |
Q3 | 113230000 |
95-th percentile | 214870000 |
Maximum | 241940896 |
Range | 241938374 |
Interquartile range | 102500000 |
Descriptive statistics
Standard deviation | 69127000 |
---|---|
Coef of variation | 1.0119 |
Kurtosis | -0.29134 |
Mean | 68312000 |
MAD | 58264000 |
Skewness | 0.96756 |
Sum | 770289687845 |
Variance | 4778500000000000 |
Memory size | 88.2 KiB |
Value | Count | Frequency (%) | |
8632750 | 85 | 0.8% |
|
2816192 | 77 | 0.7% |
|
54441651 | 56 | 0.5% |
|
5874520 | 53 | 0.5% |
|
518644 | 51 | 0.5% |
|
4331202 | 46 | 0.4% |
|
1547126 | 35 | 0.3% |
|
37769736 | 34 | 0.3% |
|
162761604 | 31 | 0.3% |
|
17712311 | 31 | 0.3% |
|
Other values (7438) | 10777 | 95.6% |
|
Minimum 5 values
Value | Count | Frequency (%) | |
2522 | 1 | 0.0% |
|
5783 | 2 | 0.0% |
|
19997 | 1 | 0.0% |
|
22467 | 1 | 0.0% |
|
45425 | 2 | 0.0% |
|
Maximum 5 values
Value | Count | Frequency (%) | |
241836874 | 1 | 0.0% |
|
241838343 | 1 | 0.0% |
|
241840731 | 1 | 0.0% |
|
241846485 | 1 | 0.0% |
|
241940896 | 1 | 0.0% |
|
host_name
Categorical
Distinct count | 2978 |
---|---|
Unique (%) | 26.4% |
Missing (%) | 0.0% |
Missing (n) | 3 |
Michael |
|
---|---|
Martin |
|
Andreas |
|
Other values (2974) |
10762
|
Value | Count | Frequency (%) | |
Michael | 175 | 1.6% |
|
Martin | 174 | 1.5% |
|
Andreas | 162 | 1.4% |
|
Anna | 96 | 0.9% |
|
Christian | 88 | 0.8% |
|
Florian | 86 | 0.8% |
|
Julia | 80 | 0.7% |
|
Stefan | 80 | 0.7% |
|
Peter | 77 | 0.7% |
|
Thomas | 77 | 0.7% |
|
Other values (2967) | 10178 | 90.3% |
|
id
Numeric
Distinct count | 11276 |
---|---|
Unique (%) | 100.0% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 17915000 |
---|---|
Minimum | 2309 |
Maximum | 32241530 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 2309 |
---|---|
5-th percentile | 1443700 |
Q1 | 10101000 |
Median | 19291000 |
Q3 | 25969000 |
95-th percentile | 31198000 |
Maximum | 32241530 |
Range | 32239221 |
Interquartile range | 15868000 |
Descriptive statistics
Standard deviation | 9416100 |
---|---|
Coef of variation | 0.52559 |
Kurtosis | -1.0707 |
Mean | 17915000 |
MAD | 8034500 |
Skewness | -0.29325 |
Sum | 202010479906 |
Variance | 88662000000000 |
Memory size | 88.2 KiB |
Value | Count | Frequency (%) | |
27478015 | 1 | 0.0% |
|
31605802 | 1 | 0.0% |
|
222614 | 1 | 0.0% |
|
11996563 | 1 | 0.0% |
|
673170 | 1 | 0.0% |
|
531857 | 1 | 0.0% |
|
26547600 | 1 | 0.0% |
|
15445391 | 1 | 0.0% |
|
23285541 | 1 | 0.0% |
|
1722869 | 1 | 0.0% |
|
Other values (11266) | 11266 | 99.9% |
|
Minimum 5 values
Value | Count | Frequency (%) | |
2309 | 1 | 0.0% |
|
15883 | 1 | 0.0% |
|
38768 | 1 | 0.0% |
|
40625 | 1 | 0.0% |
|
51287 | 1 | 0.0% |
|
Maximum 5 values
Value | Count | Frequency (%) | |
32238075 | 1 | 0.0% |
|
32238907 | 1 | 0.0% |
|
32241000 | 1 | 0.0% |
|
32241254 | 1 | 0.0% |
|
32241530 | 1 | 0.0% |
|
last_review
Categorical
Distinct count | 1017 |
---|---|
Unique (%) | 9.0% |
Missing (%) | 16.7% |
Missing (n) | 1882 |
2019-01-02 |
|
---|---|
2019-01-01 |
|
2019-01-03 |
|
Other values (1013) |
8234
|
(Missing) |
1882
|
Value | Count | Frequency (%) | |
2019-01-02 | 482 | 4.3% |
|
2019-01-01 | 370 | 3.3% |
|
2019-01-03 | 308 | 2.7% |
|
2019-02-03 | 288 | 2.6% |
|
2019-01-04 | 243 | 2.2% |
|
2019-01-06 | 223 | 2.0% |
|
2019-01-20 | 222 | 2.0% |
|
2019-01-27 | 208 | 1.8% |
|
2019-01-05 | 183 | 1.6% |
|
2019-02-04 | 137 | 1.2% |
|
Other values (1006) | 6730 | 59.7% |
|
(Missing) | 1882 | 16.7% |
|
latitude
Numeric
Distinct count | 11276 |
---|---|
Unique (%) | 100.0% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 48.206 |
---|---|
Minimum | 48.126 |
Maximum | 48.299 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 48.126 |
---|---|
5-th percentile | 48.177 |
Q1 | 48.193 |
Median | 48.206 |
Q3 | 48.219 |
95-th percentile | 48.237 |
Maximum | 48.299 |
Range | 0.17273 |
Interquartile range | 0.026568 |
Descriptive statistics
Standard deviation | 0.019361 |
---|---|
Coef of variation | 0.00040162 |
Kurtosis | 0.89116 |
Mean | 48.206 |
MAD | 0.01537 |
Skewness | 0.2306 |
Sum | 543580 |
Variance | 0.00037484 |
Memory size | 88.2 KiB |
Value | Count | Frequency (%) | |
48.2336551073448 | 1 | 0.0% |
|
48.2064998938564 | 1 | 0.0% |
|
48.20861780925839 | 1 | 0.0% |
|
48.2001944308107 | 1 | 0.0% |
|
48.194082532857536 | 1 | 0.0% |
|
48.23273813763047 | 1 | 0.0% |
|
48.22726068198479 | 1 | 0.0% |
|
48.20625615668543 | 1 | 0.0% |
|
48.21057288277489 | 1 | 0.0% |
|
48.17898367055073 | 1 | 0.0% |
|
Other values (11266) | 11266 | 99.9% |
|
Minimum 5 values
Value | Count | Frequency (%) | |
48.12584773082685 | 1 | 0.0% |
|
48.127215541553575 | 1 | 0.0% |
|
48.12802821076231 | 1 | 0.0% |
|
48.12817621297169 | 1 | 0.0% |
|
48.128312506896975 | 1 | 0.0% |
|
Maximum 5 values
Value | Count | Frequency (%) | |
48.288447052755615 | 1 | 0.0% |
|
48.28892879656033 | 1 | 0.0% |
|
48.29041636614624 | 1 | 0.0% |
|
48.294597566084086 | 1 | 0.0% |
|
48.298572734125635 | 1 | 0.0% |
|
longitude
Numeric
Distinct count | 11276 |
---|---|
Unique (%) | 100.0% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 16.361 |
---|---|
Minimum | 16.191 |
Maximum | 16.547 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 16.191 |
---|---|
5-th percentile | 16.312 |
Q1 | 16.341 |
Median | 16.359 |
Q3 | 16.38 |
95-th percentile | 16.41 |
Maximum | 16.547 |
Range | 0.35589 |
Interquartile range | 0.038523 |
Descriptive statistics
Standard deviation | 0.03411 |
---|---|
Coef of variation | 0.0020849 |
Kurtosis | 4.7539 |
Mean | 16.361 |
MAD | 0.024842 |
Skewness | 0.79622 |
Sum | 184490 |
Variance | 0.0011635 |
Memory size | 88.2 KiB |
Value | Count | Frequency (%) | |
16.342352399882813 | 1 | 0.0% |
|
16.352019635959465 | 1 | 0.0% |
|
16.36066044451892 | 1 | 0.0% |
|
16.397024752710358 | 1 | 0.0% |
|
16.381250994038005 | 1 | 0.0% |
|
16.323166397156534 | 1 | 0.0% |
|
16.385078685702723 | 1 | 0.0% |
|
16.349879422559475 | 1 | 0.0% |
|
16.374395517305018 | 1 | 0.0% |
|
16.38563390964956 | 1 | 0.0% |
|
Other values (11266) | 11266 | 99.9% |
|
Minimum 5 values
Value | Count | Frequency (%) | |
16.190897740928744 | 1 | 0.0% |
|
16.194535902710175 | 1 | 0.0% |
|
16.196278362407188 | 1 | 0.0% |
|
16.204514395161752 | 1 | 0.0% |
|
16.208645989414812 | 1 | 0.0% |
|
Maximum 5 values
Value | Count | Frequency (%) | |
16.54668250895395 | 1 | 0.0% |
|
16.54672497637489 | 1 | 0.0% |
|
16.546724979514845 | 1 | 0.0% |
|
16.546741469300017 | 1 | 0.0% |
|
16.546786535612462 | 1 | 0.0% |
|
minimum_nights
Numeric
Distinct count | 58 |
---|---|
Unique (%) | 0.5% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 4.2371 |
---|---|
Minimum | 1 |
Maximum | 1000 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 2 |
Q3 | 3 |
95-th percentile | 13 |
Maximum | 1000 |
Range | 999 |
Interquartile range | 2 |
Descriptive statistics
Standard deviation | 17.972 |
---|---|
Coef of variation | 4.2416 |
Kurtosis | 1723.9 |
Mean | 4.2371 |
MAD | 4.0564 |
Skewness | 34.34 |
Sum | 47777 |
Variance | 322.98 |
Memory size | 88.2 KiB |
Value | Count | Frequency (%) | |
1 | 3725 | 33.0% |
|
2 | 3674 | 32.6% |
|
3 | 2001 | 17.7% |
|
4 | 497 | 4.4% |
|
5 | 326 | 2.9% |
|
7 | 257 | 2.3% |
|
30 | 149 | 1.3% |
|
6 | 120 | 1.1% |
|
14 | 97 | 0.9% |
|
10 | 69 | 0.6% |
|
Other values (48) | 361 | 3.2% |
|
Minimum 5 values
Value | Count | Frequency (%) | |
1 | 3725 | 33.0% |
|
2 | 3674 | 32.6% |
|
3 | 2001 | 17.7% |
|
4 | 497 | 4.4% |
|
5 | 326 | 2.9% |
|
Maximum 5 values
Value | Count | Frequency (%) | |
214 | 1 | 0.0% |
|
300 | 2 | 0.0% |
|
365 | 2 | 0.0% |
|
999 | 1 | 0.0% |
|
1000 | 1 | 0.0% |
|
name
Categorical
Distinct count | 11051 |
---|---|
Unique (%) | 98.0% |
Missing (%) | 0.2% |
Missing (n) | 18 |
Cozy apartment in the heart of Vienna |
|
---|---|
City Center Apartment |
|
City Pension Stephansplatz |
|
Other values (11047) |
11242
|
(Missing) |
|
Value | Count | Frequency (%) | |
Cozy apartment in the heart of Vienna | 6 | 0.1% |
|
City Center Apartment | 5 | 0.0% |
|
City Pension Stephansplatz | 5 | 0.0% |
|
Wien Wohnung | 5 | 0.0% |
|
Central Private Room | 5 | 0.0% |
|
Adelin Pension und Zimmervermietung | 5 | 0.0% |
|
1 Bedroom Apartment with Balcony | 4 | 0.0% |
|
Charming Studio | 4 | 0.0% |
|
Vienna Dream Apartments | 4 | 0.0% |
|
Family Apartment | 4 | 0.0% |
|
Other values (11040) | 11211 | 99.4% |
|
(Missing) | 18 | 0.2% |
|
neighbourhood
Categorical
Distinct count | 23 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Leopoldstadt |
|
---|---|
Landstra§e |
|
Alsergrund |
|
Other values (20) |
8309
|
Value | Count | Frequency (%) | |
Leopoldstadt | 1223 | 10.8% |
|
Landstra§e | 972 | 8.6% |
|
Alsergrund | 772 | 6.8% |
|
Neubau | 731 | 6.5% |
|
Margareten | 728 | 6.5% |
|
Innere Stadt | 714 | 6.3% |
|
Rudolfsheim-Fnfhaus | 675 | 6.0% |
|
Mariahilf | 576 | 5.1% |
|
Favoriten | 554 | 4.9% |
|
Wieden | 548 | 4.9% |
|
Other values (13) | 3783 | 33.5% |
|
neighbourhood_group
Constant
This variable is constant and should be ignored for analysis
Constant value |
---|
number_of_reviews
Numeric
Distinct count | 324 |
---|---|
Unique (%) | 2.9% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 28.989 |
---|---|
Minimum | 0 |
Maximum | 514 |
Zeros (%) | 16.7% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 2 |
Median | 9 |
Q3 | 32 |
95-th percentile | 130 |
Maximum | 514 |
Range | 514 |
Interquartile range | 30 |
Descriptive statistics
Standard deviation | 51.326 |
---|---|
Coef of variation | 1.7705 |
Kurtosis | 14.779 |
Mean | 28.989 |
MAD | 32.382 |
Skewness | 3.3696 |
Sum | 326885 |
Variance | 2634.4 |
Memory size | 88.2 KiB |
Value | Count | Frequency (%) | |
0 | 1882 | 16.7% |
|
1 | 925 | 8.2% |
|
2 | 658 | 5.8% |
|
3 | 531 | 4.7% |
|
4 | 418 | 3.7% |
|
5 | 368 | 3.3% |
|
7 | 314 | 2.8% |
|
6 | 300 | 2.7% |
|
9 | 237 | 2.1% |
|
8 | 227 | 2.0% |
|
Other values (314) | 5416 | 48.0% |
|
Minimum 5 values
Value | Count | Frequency (%) | |
0 | 1882 | 16.7% |
|
1 | 925 | 8.2% |
|
2 | 658 | 5.8% |
|
3 | 531 | 4.7% |
|
4 | 418 | 3.7% |
|
Maximum 5 values
Value | Count | Frequency (%) | |
460 | 1 | 0.0% |
|
463 | 1 | 0.0% |
|
471 | 1 | 0.0% |
|
501 | 1 | 0.0% |
|
514 | 1 | 0.0% |
|
price
Numeric
Distinct count | 282 |
---|---|
Unique (%) | 2.5% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 77.851 |
---|---|
Minimum | 9 |
Maximum | 9270 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 9 |
---|---|
5-th percentile | 22 |
Q1 | 38 |
Median | 56 |
Q3 | 85 |
95-th percentile | 185 |
Maximum | 9270 |
Range | 9261 |
Interquartile range | 47 |
Descriptive statistics
Standard deviation | 134.4 |
---|---|
Coef of variation | 1.7263 |
Kurtosis | 2193.3 |
Mean | 77.851 |
MAD | 45.459 |
Skewness | 36.36 |
Sum | 877844 |
Variance | 18063 |
Memory size | 88.2 KiB |
Value | Count | Frequency (%) | |
50 | 459 | 4.1% |
|
40 | 417 | 3.7% |
|
60 | 403 | 3.6% |
|
30 | 398 | 3.5% |
|
45 | 396 | 3.5% |
|
35 | 392 | 3.5% |
|
55 | 335 | 3.0% |
|
80 | 306 | 2.7% |
|
25 | 306 | 2.7% |
|
65 | 301 | 2.7% |
|
Other values (272) | 7563 | 67.1% |
|
Minimum 5 values
Value | Count | Frequency (%) | |
9 | 1 | 0.0% |
|
10 | 14 | 0.1% |
|
11 | 6 | 0.1% |
|
12 | 14 | 0.1% |
|
13 | 11 | 0.1% |
|
Maximum 5 values
Value | Count | Frequency (%) | |
1250 | 1 | 0.0% |
|
1510 | 1 | 0.0% |
|
2500 | 1 | 0.0% |
|
5500 | 1 | 0.0% |
|
9270 | 1 | 0.0% |
|
reviews_per_month
Numeric
Distinct count | 834 |
---|---|
Unique (%) | 7.4% |
Missing (%) | 16.7% |
Missing (n) | 1882 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.7579 |
---|---|
Minimum | 0.01 |
Maximum | 14.23 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 0.01 |
---|---|
5-th percentile | 0.06 |
Q1 | 0.35 |
Median | 1 |
Q3 | 2.59 |
95-th percentile | 5.81 |
Maximum | 14.23 |
Range | 14.22 |
Interquartile range | 2.24 |
Descriptive statistics
Standard deviation | 1.9175 |
---|---|
Coef of variation | 1.0908 |
Kurtosis | 2.8395 |
Mean | 1.7579 |
MAD | 1.4816 |
Skewness | 1.6364 |
Sum | 16513 |
Variance | 3.6768 |
Memory size | 88.2 KiB |
Value | Count | Frequency (%) | |
0.03 | 126 | 1.1% |
|
1.0 | 120 | 1.1% |
|
0.07 | 118 | 1.0% |
|
0.05 | 115 | 1.0% |
|
0.15 | 98 | 0.9% |
|
0.06 | 95 | 0.8% |
|
0.1 | 90 | 0.8% |
|
0.16 | 87 | 0.8% |
|
0.11 | 87 | 0.8% |
|
0.02 | 79 | 0.7% |
|
Other values (823) | 8379 | 74.3% |
|
(Missing) | 1882 | 16.7% |
|
Minimum 5 values
Value | Count | Frequency (%) | |
0.01 | 1 | 0.0% |
|
0.02 | 79 | 0.7% |
|
0.03 | 126 | 1.1% |
|
0.04 | 68 | 0.6% |
|
0.05 | 115 | 1.0% |
|
Maximum 5 values
Value | Count | Frequency (%) | |
11.79 | 1 | 0.0% |
|
12.15 | 1 | 0.0% |
|
12.8 | 1 | 0.0% |
|
14.0 | 1 | 0.0% |
|
14.23 | 1 | 0.0% |
|
room_type
Categorical
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Entire home/apt |
8173
|
---|---|
Private room |
3005
|
Shared room |
|
Value | Count | Frequency (%) | |
Entire home/apt | 8173 | 72.5% |
|
Private room | 3005 | 26.6% |
|
Shared room | 98 | 0.9% |
|
| | id | name | host_id | host_name | neighbourhood_group | neighbourhood | latitude | longitude | room_type | price | minimum_nights | number_of_reviews | last_review | reviews_per_month | calculated_host_listings_count | availability_365 |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | 2309 | Greenview Design Apartment | 2522 | Chris | NaN | Leopoldstadt | 48.202814 | 16.404353 | Entire home/apt | 80 | 4 | 66 | 2018-06-03 | 0.62 | 1 | 338 |
1 | 15883 | b&b near Old Danube river | 62142 | Eva | NaN | Donaustadt | 48.241436 | 16.428118 | Private room | 85 | 1 | 9 | 2018-01-03 | 0.19 | 5 | 287 |
2 | 38768 | central cityapartement- wifi- nice neighbourhood | 166283 | Hannes | NaN | Leopoldstadt | 48.218225 | 16.379255 | Entire home/apt | 65 | 3 | 271 | 2019-01-05 | 2.82 | 2 | 129 |
3 | 40625 | Near Palace Schönbrunn, Apt. 1 | 175131 | Ingela | NaN | Rudolfsheim-Fnfhaus | 48.184862 | 16.327401 | Entire home/apt | 99 | 1 | 128 | 2019-01-07 | 1.23 | 13 | 291 |
4 | 51287 | little studio- next to citycenter- wifi- nice ... | 166283 | Hannes | NaN | Leopoldstadt | 48.218514 | 16.377810 | Entire home/apt | 60 | 3 | 243 | 2019-01-08 | 2.48 | 2 | 146 |