Berlin is famous worldwide for its nightlife. The data set we will work with stores the geographical locations of clubs and bars in Berlin. The data originates from OpenStreetMap (OSM). It was downloaded from GEOFABRIK on August 15, 2022, and contains OpenStreetMap data as of August 14, 2022 (see here).

We download the data and read the osm_pois_p.shp file, which corresponds to points of interest in Berlin, using the read_file() function from the GeoPandas package.

In [2]:
# First, let's import the needed libraries.
import matplotlib.pyplot as plt
import numpy as np
import random
import pandas as pd
import geopandas as gpd
import folium

The GeoPandas package

GeoPandas provides two main data structures, namely GeoSeries and GeoDataFrame, which correspond to pandas.Series and pandas.DataFrame, respectively. A GeoSeries is a vector where each entry is a set of shapes corresponding to one observation. A GeoDataFrame is a tabular data structure that contains a GeoSeries as a column holding the spatial information, alongside additional information in the other columns. This spatial column is often called geometry and can be accessed through the geometry attribute (gdf.geometry).

The package provides three basic classes of geometric objects:

  • Points / Multi-Points
  • Lines / Multi-Lines
  • Polygons / Multi-Polygons

See the documentation of the GeoPandas package here.
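To make the relationship between the two data structures concrete, here is a minimal sketch that builds a GeoDataFrame from scratch. The coordinates and names are hypothetical example values, not part of the Berlin data set.

```python
import pandas as pd
import geopandas as gpd

# hypothetical example data: two named points with lon/lat coordinates
df = pd.DataFrame({"name": ["A", "B"], "lon": [13.40, 13.38], "lat": [52.52, 52.50]})

# points_from_xy turns the coordinate columns into shapely Points;
# passing them as `geometry` creates the active geometry column
gdf = gpd.GeoDataFrame(df, geometry=gpd.points_from_xy(df["lon"], df["lat"]))

print(gdf.geometry.name)  # prints "geometry" -- the active geometry column
```

The geometry column behaves like any other column, but it additionally supports spatial operations (distances, intersections, re-projection, ...).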

Reading Files to GeoPandas

GeoPandas can read almost any vector-based spatial data format (e.g. ESRI Shapefile, GeoJSON, ...). For this purpose we use geopandas.read_file(). Here, we read a shapefile stored as a .zip file into a GeoDataFrame as follows.

In [3]:
berlin_features = gpd.read_file("C:/Users/mceck/soga/Soga-Py/300/data/osm_pois_p.zip")

berlin_features.head()
Out[3]:
   osm_id    code  fclass               name        geometry
0  16541597  2907  camera_surveillance  Aral        POINT (13.34544 52.54644)
1  26735749  2301  restaurant           Aida        POINT (13.32282 52.50691)
2  26735753  2006  telephone            None        POINT (13.32214 52.50645)
3  26735759  2301  restaurant           Madame Ngo  POINT (13.31808 52.50621)
4  26735763  2301  restaurant           Thanh Long  POINT (13.32078 52.50732)
In [4]:
berlin_features.dtypes
Out[4]:
osm_id        object
code           int64
fclass        object
name          object
geometry    geometry
dtype: object

There are 82491 records (denoted as features), represented as rows, and 5 attributes (denoted as fields), represented as columns.

Looking at the column names, we see that the category of each point is stored in the fclass column. Note that berlin_features provides a geometry column holding the geometric points. Even if the active geometry column were not named geometry, GeoPandas could still access it through the .geometry attribute.

In [5]:
berlin_features.geometry
Out[5]:
0        POINT (13.34544 52.54644)
1        POINT (13.32282 52.50691)
2        POINT (13.32214 52.50645)
3        POINT (13.31808 52.50621)
4        POINT (13.32078 52.50732)
                   ...            
82486    POINT (13.29562 52.43827)
82487    POINT (13.29558 52.43829)
82488    POINT (13.31360 52.47638)
82489    POINT (13.63331 52.52282)
82490    POINT (13.49256 52.54817)
Name: geometry, Length: 82491, dtype: geometry
In [6]:
berlin_features.columns
Out[6]:
Index(['osm_id', 'code', 'fclass', 'name', 'geometry'], dtype='object')

By applying the set() function we get an overview of the different categories represented in the data set.

In [7]:
set(berlin_features["fclass"])  ## get unique values
Out[7]:
{'archaeological',
 'arts_centre',
 'artwork',
 'atm',
 'attraction',
 'bakery',
 'bank',
 'bar',
 'battlefield',
 'beauty_shop',
 'bench',
 'beverages',
 'bicycle_rental',
 'bicycle_shop',
 'biergarten',
 'bookshop',
 'butcher',
 'cafe',
 'camera_surveillance',
 'camp_site',
 'car_dealership',
 'car_rental',
 'car_sharing',
 'car_wash',
 'caravan_site',
 'chalet',
 'chemist',
 'cinema',
 'clinic',
 'clothes',
 'college',
 'comms_tower',
 'community_centre',
 'computer_shop',
 'convenience',
 'courthouse',
 'dentist',
 'department_store',
 'doctors',
 'dog_park',
 'doityourself',
 'drinking_water',
 'embassy',
 'fast_food',
 'fire_station',
 'florist',
 'food_court',
 'fountain',
 'furniture_shop',
 'garden_centre',
 'general',
 'gift_shop',
 'golf_course',
 'graveyard',
 'greengrocer',
 'guesthouse',
 'hairdresser',
 'hospital',
 'hostel',
 'hotel',
 'hunting_stand',
 'jeweller',
 'kindergarten',
 'kiosk',
 'laundry',
 'library',
 'mall',
 'market_place',
 'memorial',
 'mobile_phone_shop',
 'monument',
 'motel',
 'museum',
 'newsagent',
 'nightclub',
 'nursing_home',
 'observation_tower',
 'optician',
 'outdoor_shop',
 'park',
 'pharmacy',
 'picnic_site',
 'pitch',
 'playground',
 'police',
 'post_box',
 'post_office',
 'prison',
 'pub',
 'recycling',
 'recycling_clothes',
 'recycling_glass',
 'recycling_paper',
 'restaurant',
 'ruins',
 'school',
 'shelter',
 'shoe_shop',
 'sports_centre',
 'sports_shop',
 'stadium',
 'stationery',
 'supermarket',
 'swimming_pool',
 'telephone',
 'theatre',
 'theme_park',
 'toilet',
 'tourist_info',
 'tower',
 'town_hall',
 'toy_shop',
 'track',
 'travel_agent',
 'university',
 'vending_any',
 'vending_cigarette',
 'vending_machine',
 'vending_parking',
 'veterinary',
 'video_shop',
 'viewpoint',
 'waste_basket',
 'water_mill',
 'water_tower',
 'water_well',
 'water_works',
 'wayside_cross',
 'wayside_shrine',
 'zoo'}

Now we subset our data set to include only the categories nightclub and bar, using the | (or) operator.

In [8]:
berlin_locations = berlin_features[
    (berlin_features["fclass"] == "nightclub") | (berlin_features["fclass"] == "bar")
]

We plot the relative frequencies of the categories in our data set by combining value_counts(normalize = True) with the pandas plot(kind="bar") method.

In [9]:
plt.figure(figsize=(8, 6))
berlin_locations["fclass"].value_counts(normalize=True).plot(
    kind="bar"
)  ## plot relative frequency
plt.xticks(rotation=0)
Out[9]:
(array([0, 1]), [Text(0, 0, 'bar'), Text(1, 0, 'nightclub')])

As expected, there are considerably more locations denoted as bar in our data set than locations denoted as nightclub. To get the absolute counts we use the value_counts() function again.

In [10]:
berlin_locations["fclass"].value_counts()
Out[10]:
bar          806
nightclub    131
Name: fclass, dtype: int64
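As a side note, value_counts(normalize=True) simply divides each count by the total number of observations. A hypothetical miniature example:

```python
import pandas as pd

# hypothetical example data, not the Berlin data set
s = pd.Series(["bar", "bar", "bar", "nightclub"])

print(s.value_counts())                # bar: 3, nightclub: 1
print(s.value_counts(normalize=True))  # bar: 0.75, nightclub: 0.25
```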

To visualize the data we plot it using the folium package.

In [11]:
berlinmap = folium.Map([52.5464450, 13.34544], zoom_start=10, tiles="cartodbpositron")

group0 = folium.FeatureGroup(name='<span style="color: red;">nightclub</span>')
group1 = folium.FeatureGroup(name='<span style="color: darkblue;">bar</span>')

for _, row in berlin_locations.iterrows():
    if row["fclass"] == "nightclub":
        folium.CircleMarker(
            [row.geometry.y, row.geometry.x],
            popup=row["name"],
            radius=3,
            color="red",
        ).add_to(group0)
    elif row["fclass"] == "bar":
        folium.CircleMarker(
            [row.geometry.y, row.geometry.x],
            popup=row["name"],
            radius=3,
            color="darkblue",
        ).add_to(group1)

group0.add_to(berlinmap)
group1.add_to(berlinmap)
folium.map.LayerControl("topright", collapsed=False).add_to(berlinmap)

berlinmap
Out[11]:
[interactive folium map of bar (dark blue) and nightclub (red) locations in Berlin]

Re-Projecting

Finally, we re-project the berlin_locations data set to the European Terrestrial Reference System 1989 (ETRS89/UTM zone 32N) for further usage. Re-projecting is the process of changing the representation of locations from one coordinate system to another. To do so, we use the GeoDataFrame.to_crs() function and provide the EPSG identifier for ETRS89/UTM zone 32N, which is $25832$ (see here).

In [12]:
berlin_locations = berlin_locations.to_crs(
    "EPSG:25832"
)  # or: berlin_locations.to_crs(epsg=25832)

# get information about crs
berlin_locations.crs
Out[12]:
<Derived Projected CRS: EPSG:25832>
Name: ETRS89 / UTM zone 32N
Axis Info [cartesian]:
- E[east]: Easting (metre)
- N[north]: Northing (metre)
Area of Use:
- name: Europe between 6°E and 12°E: Austria; Belgium; Denmark - onshore and offshore; Germany - onshore and offshore; Norway including - onshore and offshore; Spain - offshore.
- bounds: (6.0, 38.76, 12.0, 84.33)
Coordinate Operation:
- name: UTM zone 32N
- method: Transverse Mercator
Datum: European Terrestrial Reference System 1989 ensemble
- Ellipsoid: GRS 1980
- Prime Meridian: Greenwich
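Under the hood, GeoPandas delegates the coordinate transformation to the pyproj package (a GeoPandas dependency). As a sketch of what happens to a single coordinate, the following re-projects a hypothetical lon/lat point in central Berlin; note that after the transformation the coordinates are metres, not degrees:

```python
from pyproj import Transformer

# EPSG:4326 (lon/lat in degrees) -> EPSG:25832 (ETRS89 / UTM zone 32N, metres)
transformer = Transformer.from_crs("EPSG:4326", "EPSG:25832", always_xy=True)

# a hypothetical point in central Berlin (lon, lat)
easting, northing = transformer.transform(13.345, 52.546)

# easting/northing are now expressed in metres, suitable for distance calculations
print(round(easting), round(northing))
```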

Regularly spaced and random data

To contrast particular statistical methods for spatial point pattern analysis, we construct two artificial data sets. One data set, berlin_random, consists of points randomly distributed over the area of Berlin. The other data set, berlin_regular, consists of points distributed fairly regularly across the area of Berlin.

Before we start with the data generation we have to set the geographical extent. Hence, we load the district borders (berlin_district) as a GeoPandas object and plot them. You can download the shapefile here.

In [13]:
berlin_district = gpd.read_file(
    "http://userpage.fu-berlin.de/soga/soga-py/300/30800_spatial_point_patterns/berlin_district.zip"
)
In [14]:
berlin_district.plot(figsize=(12, 5), color="red")

plt.show()

We take the bounding box of the berlin_district variable to set the geographic extent for the data generation process.

In [15]:
# find bounds of geodataframe
x_min, y_min, x_max, y_max = berlin_district.total_bounds
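Conceptually, total_bounds returns the envelope (minx, miny, maxx, maxy) of all geometries, which is nothing more than the column-wise minima and maxima of the coordinates. A sketch with hypothetical points:

```python
import numpy as np

# hypothetical (x, y) coordinate pairs
coords = np.array([[1.0, 4.0], [3.0, 2.0], [2.0, 5.0]])

x_min, y_min = coords.min(axis=0)  # column-wise minima
x_max, y_max = coords.max(axis=0)  # column-wise maxima

print(x_min, y_min, x_max, y_max)  # 1.0 2.0 3.0 5.0
```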

Random points

First we generate uniformly distributed random numbers using the np.random.uniform() function from NumPy.

In [16]:
# set seed for reproducibility (np.random.uniform draws from NumPy's generator)
np.random.seed(1111)

# set sample size
n = round(berlin_locations.shape[0] * 0.4)

## generate random uniform numbers
x_random = np.random.uniform(x_min, x_max, n)
y_random = np.random.uniform(y_min, y_max, n)

Then we combine the random number vectors into a GeoSeries object and plot it together with the district border of Berlin.

In [17]:
# convert to GeoSeries
random_points = gpd.GeoSeries(gpd.points_from_xy(x_random, y_random))
# only keep those points within berlin_district
berlin_random = random_points[random_points.within(berlin_district.unary_union)]
In [18]:
fig, ax = plt.subplots(figsize=(10, 5))
berlin_district.plot(ax=ax, edgecolor="darkblue", linewidth=1, color="white")
berlin_random.plot(
    ax=ax,
    edgecolor="black",
    color="lightgrey",
)
plt.title("Random Points")

plt.show()
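The approach above is a form of rejection sampling: draw points uniformly within the bounding box, then keep only those that fall inside the study area. The same idea can be sketched with plain NumPy, using a circle instead of the Berlin polygon as the (hypothetical) study area:

```python
import numpy as np

rng = np.random.default_rng(1111)

# draw uniform points in the unit square (the "bounding box")
x = rng.uniform(0.0, 1.0, 1000)
y = rng.uniform(0.0, 1.0, 1000)

# keep only points inside a circle of radius 0.5 around (0.5, 0.5)
inside = (x - 0.5) ** 2 + (y - 0.5) ** 2 < 0.5 ** 2
x_kept, y_kept = x[inside], y[inside]

# roughly pi/4 (about 78.5%) of the points survive: the area ratio
# of the circle to the enclosing square
print(inside.mean())
```

In the Berlin example, within() plays the role of the circle test, and unary_union merges the district polygons into a single study area.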

Regular points

First we generate evenly spaced coordinate sequences using the np.linspace() function.

In [19]:
n = round(np.sqrt(berlin_locations.shape[0]) * 0.35)
x_regular = np.linspace(x_min, x_max, n)
y_regular = np.linspace(y_min, y_max, n)

Then we create a GeoSeries from all coordinate combinations using np.meshgrid() and the points_from_xy() function.

In [20]:
xx, yy = np.meshgrid(x_regular, y_regular)
xx = xx.flatten()
yy = yy.flatten()

grid_points = gpd.GeoSeries(gpd.points_from_xy(xx, yy))

## cut to size
berlin_regular = grid_points[grid_points.within(berlin_district.unary_union)]
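To see what np.meshgrid() produces, here is a hypothetical miniature example: two short coordinate vectors are expanded into every (x, y) combination, and flattening the grids yields the coordinates of all grid points.

```python
import numpy as np

x = np.array([0, 1])
y = np.array([10, 20, 30])

xx, yy = np.meshgrid(x, y)  # grids of shape (3, 2)

print(xx.flatten())  # [0 1 0 1 0 1]
print(yy.flatten())  # [10 10 20 20 30 30]
```

Paired element-wise, the flattened arrays enumerate all 2 × 3 = 6 grid points.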
In [21]:
fig, ax = plt.subplots(figsize=(10, 5))
berlin_district.plot(ax=ax, edgecolor="darkblue", linewidth=1, color="white")
berlin_regular.plot(
    ax=ax,
    edgecolor="black",
    color="lightgrey",
)
plt.title("Regular Points")

plt.show()

Writing Spatial Data

GeoDataFrames can be exported to many standard formats using the geopandas.GeoDataFrame.to_file() function. Two commonly used formats are ESRI Shapefile and GeoJSON:

In [22]:
## Writing to Shapefile:

berlin_random.to_file("../data/berlin_random.shp")

## Writing to GeoJSON:

berlin_random.to_file("../data/berlin_random.geojson", driver="GeoJSON")

For further usage we also save the berlin_locations and berlin_regular data sets as .geojson files for further processing.

In [23]:
## Writing to GeoJSON:

berlin_locations.to_file("../data/berlin_locations.geojson", driver="GeoJSON")

berlin_regular.to_file("../data/berlin_regular.geojson", driver="GeoJSON")

Citation

The E-Learning project SOGA-Py was developed at the Department of Earth Sciences by Annette Rudolph, Joachim Krois and Kai Hartmann. You can reach us via mail by soga[at]zedat.fu-berlin.de.

Creative Commons License
You may use this project freely under the Creative Commons Attribution-ShareAlike 4.0 International License.

Please cite as follows: Rudolph, A., Krois, J., Hartmann, K. (2023): Statistics and Geodata Analysis using Python (SOGA-Py). Department of Earth Sciences, Freie Universitaet Berlin.