{ "cells": [ { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "0.7747386150504332\n", "5207\n" ] }, { "data": { "text/plain": [ "array(['House', 'Condominium', 'Townhouse', 'Apartment', 'Other', 'Loft',\n", " 'Guest suite', 'Guesthouse', 'In-law', 'Boutique hotel', 'Boat',\n", " 'Hostel', 'Bed & Breakfast', 'Dorm', 'Timeshare',\n", " 'Serviced apartment', 'Vacation home', 'Bungalow', 'Villa'],\n", " dtype=object)" ] }, "execution_count": 2, "metadata": {}, "output_type": "execute_result" } ], "source": [ "import pandas as pd\n", "import random\n", "\n", "# Seed the stdlib RNG so the sampled value is the same on every Restart & Run All.\n", "SEED = 42\n", "random.seed(SEED)\n", "print(random.uniform(0, 1))\n", "\n", "# Load the listings export (path is relative to the notebook's working directory).\n", "LISTINGS_CSV = 'Airbnb_data/listings_SanFan.csv'\n", "df = pd.read_csv(LISTINGS_CSV)\n", "print(len(df))\n", "\n", "# Only the last expression of a cell is rendered automatically, so show the\n", "# intermediate results explicitly (display is supplied by the IPython kernel).\n", "display(df['last_scraped'].nunique(dropna=False))  # distinct last_scraped values, NaN counted once\n", "display(df.head())\n", "\n", "# Last expression: rendered as the cell's result.\n", "df['property_type'].unique()" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | price | \n", "accommodates | \n", "host_response_time | \n", "bathrooms | \n", "bedrooms | \n", "beds | \n", "security_deposit | \n", "cleaning_fee | \n", "guests_included | \n", "extra_people | \n", "... | \n", "review_scores_checkin | \n", "review_scores_communication | \n", "review_scores_location | \n", "review_scores_value | \n", "house_rules | \n", "amenities | \n", "bed_type | \n", "room_type | \n", "cancellation_policy | \n", "property_type | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "$56.00 | \n", "4 | \n", "within an hour | \n", "1.0 | \n", "1.0 | \n", "2.0 | \n", "$100.00 | \n", "$30.00 | \n", "2 | \n", "$15.00 | \n", "... | \n", "10.0 | \n", "10.0 | \n", "10.0 | \n", "10.0 | \n", "- Private bathroom is on the first floor (slig... | \n", "{TV,\"Cable TV\",\"Wireless Internet\",\"Air condit... | \n", "Real Bed | \n", "Private room | \n", "moderate | \n", "House | \n", "
1 | \n", "$36.00 | \n", "2 | \n", "within an hour | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "$100.00 | \n", "$35.00 | \n", "1 | \n", "$20.00 | \n", "... | \n", "10.0 | \n", "10.0 | \n", "10.0 | \n", "10.0 | \n", "1. NO SMOKING! This rule applies for inside ou... | \n", "{TV,\"Wireless Internet\",\"Air conditioning\",Kit... | \n", "Real Bed | \n", "Private room | \n", "strict | \n", "Condominium | \n", "
2 | \n", "$80.00 | \n", "6 | \n", "within an hour | \n", "1.5 | \n", "2.0 | \n", "3.0 | \n", "$150.00 | \n", "$65.00 | \n", "4 | \n", "$15.00 | \n", "... | \n", "10.0 | \n", "10.0 | \n", "10.0 | \n", "10.0 | \n", "I don't ask much, just to please respect the s... | \n", "{TV,\"Cable TV\",Internet,\"Wireless Internet\",\"A... | \n", "Real Bed | \n", "Private room | \n", "moderate | \n", "Townhouse | \n", "
3 | \n", "$80.00 | \n", "2 | \n", "within a few hours | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "$100.00 | \n", "$10.00 | \n", "2 | \n", "$10.00 | \n", "... | \n", "10.0 | \n", "10.0 | \n", "10.0 | \n", "10.0 | \n", "Guests should treat my condo as their home wit... | \n", "{TV,\"Cable TV\",Internet,\"Wireless Internet\",\"A... | \n", "Real Bed | \n", "Private room | \n", "flexible | \n", "Condominium | \n", "
4 | \n", "$20.00 | \n", "3 | \n", "within an hour | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "$100.00 | \n", "$50.00 | \n", "1 | \n", "$10.00 | \n", "... | \n", "10.0 | \n", "10.0 | \n", "10.0 | \n", "9.0 | \n", "If using the kitchen please clean up after you... | \n", "{TV,\"Cable TV\",Internet,\"Wireless Internet\",\"A... | \n", "Real Bed | \n", "Private room | \n", "strict | \n", "Apartment | \n", "
5 rows × 27 columns
\n", "\n", " | price | \n", "accommodates | \n", "bathrooms | \n", "bedrooms | \n", "beds | \n", "security_deposit | \n", "cleaning_fee | \n", "guests_included | \n", "extra_people | \n", "minimum_nights | \n", "... | \n", "Dorm | \n", "Timeshare | \n", "Serviced apartment | \n", "Vacation home | \n", "Bungalow | \n", "Villa | \n", "within an hour | \n", "within a few hours | \n", "within a day | \n", "a few days or more | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "56.0 | \n", "4 | \n", "1.0 | \n", "1.0 | \n", "2.0 | \n", "100.0 | \n", "30.0 | \n", "2 | \n", "15.0 | \n", "2 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "
1 | \n", "36.0 | \n", "2 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "100.0 | \n", "35.0 | \n", "1 | \n", "20.0 | \n", "1 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "
2 | \n", "80.0 | \n", "6 | \n", "1.5 | \n", "2.0 | \n", "3.0 | \n", "150.0 | \n", "65.0 | \n", "4 | \n", "15.0 | \n", "1 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "
3 | \n", "80.0 | \n", "2 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "100.0 | \n", "10.0 | \n", "2 | \n", "10.0 | \n", "2 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "
4 | \n", "20.0 | \n", "3 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "100.0 | \n", "50.0 | \n", "1 | \n", "10.0 | \n", "3 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "
5 rows × 121 columns
\n", "