Michael Dorman
Geography and Environmental Development, BGU
2022-03-29
Several Python packages need to be installed and loaded to run the code examples:
import glob # File paths
import pandas as pd # Tables
import shapely.geometry # Vector geometries
import geopandas as gpd # Vector layers
import seaborn as sns # Plots (Heatmap)
import networkx as nx # Network analysis
import networkx.algorithms # Network analysis (community detection)
import textblob # Sentiment analysis
import matplotlib.pyplot as plt
pd.options.display.max_rows = 6
pd.options.display.max_columns = 8
pd.options.display.max_colwidth = 35
plt.rcParams["figure.figsize"] = (18, 8)
%%html
<style>
.dataframe td {
white-space: nowrap;
}
</style>
We also need to set the working directory to the folder with the data:
- *.json — Boston tweets
- borders.shp — County borders (Shapefile)
- network.csv — Twitter follower edge list
- locations.csv — Twitter user locations

Our examples of working with LBSN data are going to focus on Twitter data. Like most online social networks, Twitter has numerous ways to access and interact with the data.
To access the Twitter API, we first need to obtain API keys.

Once we have the API keys, the Twitter API can be accessed using various software, such as the Python package twarc. For example, a short twarc-based script can collect all available geo-referenced tweets in the area of Boston for an hour, from the Streaming API, which provides tweets in real time (a rough sketch of such a script is shown below).
The twarc script records tweets into a .json file, until the end of the current hour. If we run the script repeatedly at the beginning of each hour, we can collect tweets for longer time periods, organized into numerous .json files (one file per hour).
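The original collection script is not reproduced here. As an illustration only, a minimal sketch of such a collection step, assuming twarc 1.x (the Twarc class and its filter method with a locations parameter) and placeholder API credentials, might look like this:

# Illustrative sketch only (not the original collection script).
# Assumes twarc 1.x: Twarc(consumer_key, consumer_secret, access_token, access_token_secret)
# and Twarc.filter(locations=...), which streams tweets matching a bounding box.
import json
import datetime
from twarc import Twarc

consumer_key = "..."           # placeholder credentials
consumer_secret = "..."
access_token = "..."
access_token_secret = "..."

t = Twarc(consumer_key, consumer_secret, access_token, access_token_secret)

# Stop at the end of the current hour
now = datetime.datetime.now()
end = now.replace(minute=0, second=0, microsecond=0) + datetime.timedelta(hours=1)
outfile = now.strftime("data/boston_geobgu_%Y-%m-%d_%H:%M:%S.json")

with open(outfile, "w") as f:
    # Bounding box given as "west,south,east,north"
    for tweet in t.filter(locations="-72.21437,41.19034,-69.64939,43.30924"):
        f.write(json.dumps(tweet) + "\n")
        if datetime.datetime.now() >= end:
            break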
To process the data, we first need to detect the required file paths. For example, the following expression gets the file paths of all hours in 2022-03-11:
files = glob.glob("data/boston_*_2022-03-11*.json")
files.sort()
files
['data/boston_geobgu_2022-03-11_00:00:02.json', 'data/boston_geobgu_2022-03-11_01:00:01.json', 'data/boston_geobgu_2022-03-11_02:00:01.json', 'data/boston_geobgu_2022-03-11_03:00:02.json', 'data/boston_geobgu_2022-03-11_04:00:02.json', 'data/boston_geobgu_2022-03-11_05:00:02.json', 'data/boston_geobgu_2022-03-11_06:00:02.json', 'data/boston_geobgu_2022-03-11_07:00:00.json', 'data/boston_geobgu_2022-03-11_08:00:02.json', 'data/boston_geobgu_2022-03-11_09:00:02.json', 'data/boston_geobgu_2022-03-11_10:00:01.json', 'data/boston_geobgu_2022-03-11_11:00:02.json', 'data/boston_geobgu_2022-03-11_12:00:02.json', 'data/boston_geobgu_2022-03-11_13:00:01.json', 'data/boston_geobgu_2022-03-11_14:00:02.json', 'data/boston_geobgu_2022-03-11_15:00:00.json', 'data/boston_geobgu_2022-03-11_16:00:00.json', 'data/boston_geobgu_2022-03-11_17:00:02.json', 'data/boston_geobgu_2022-03-11_18:00:02.json', 'data/boston_geobgu_2022-03-11_19:00:01.json', 'data/boston_geobgu_2022-03-11_20:00:00.json', 'data/boston_geobgu_2022-03-11_21:00:02.json', 'data/boston_geobgu_2022-03-11_22:00:02.json', 'data/boston_geobgu_2022-03-11_23:00:00.json']
Next, we can read the files in a loop and combine them into one long table (DataFrame), using the pandas package:
dat = []
for i in files:
tmp = pd.read_json(i, lines=True)
dat.append(tmp)
dat = pd.concat(dat, axis=0)
dat = dat.sort_values("created_at")
dat = dat.reset_index(drop=True)
dat
created_at | id | id_str | text | ... | quoted_status_id | quoted_status_id_str | quoted_status | quoted_status_permalink | |
---|---|---|---|---|---|---|---|---|---|
0 | 2022-03-10 21:59:58+00:00 | 1502041600670650368 | 1502041600670650368 | Looking for a new opportunity a... | ... | NaN | NaN | NaN | NaN |
1 | 2022-03-10 22:00:03+00:00 | 1502041619343810560 | 1502041619343810560 | It's 5 o'clock in Marblehead. | ... | NaN | NaN | NaN | NaN |
2 | 2022-03-10 22:00:06+00:00 | 1502041631851167750 | 1502041631851167744 | Wind 0 mph -. Barometer 30.10 i... | ... | NaN | NaN | NaN | NaN |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
1769 | 2022-03-11 21:59:20+00:00 | 1502403827588231170 | 1502403827588231168 | See our latest #Raynham, MA Pha... | ... | NaN | NaN | NaN | NaN |
1770 | 2022-03-11 21:59:20+00:00 | 1502403825658851328 | 1502403825658851328 | Help pave the path to equitable... | ... | NaN | NaN | NaN | NaN |
1771 | 2022-03-11 21:59:25+00:00 | 1502403847368675328 | 1502403847368675328 | I'm at Harpoon Brewery in Bosto... | ... | NaN | NaN | NaN | NaN |
1772 rows × 35 columns
The resulting table contains a lot of variables. We will keep just the most useful ones:
- created_at — Time when the tweet was posted
- user — User properties
- coordinates — Geographic location
- text — Tweet text
- lang — Tweet language

vars = ["created_at", "user", "coordinates", "text", "lang"]
dat = dat[vars].copy()
dat
created_at | user | coordinates | text | lang | |
---|---|---|---|---|---|
0 | 2022-03-10 21:59:58+00:00 | {'id': 173349856, 'id_str': '17... | {'type': 'Point', 'coordinates'... | Looking for a new opportunity a... | en |
1 | 2022-03-10 22:00:03+00:00 | {'id': 2202066812, 'id_str': '2... | {'type': 'Point', 'coordinates'... | It's 5 o'clock in Marblehead. | en |
2 | 2022-03-10 22:00:06+00:00 | {'id': 217362857, 'id_str': '21... | {'type': 'Point', 'coordinates'... | Wind 0 mph -. Barometer 30.10 i... | en |
... | ... | ... | ... | ... | ... |
1769 | 2022-03-11 21:59:20+00:00 | {'id': 107912849, 'id_str': '10... | {'type': 'Point', 'coordinates'... | See our latest #Raynham, MA Pha... | en |
1770 | 2022-03-11 21:59:20+00:00 | {'id': 114312080, 'id_str': '11... | {'type': 'Point', 'coordinates'... | Help pave the path to equitable... | en |
1771 | 2022-03-11 21:59:25+00:00 | {'id': 294758966, 'id_str': '29... | {'type': 'Point', 'coordinates'... | I'm at Harpoon Brewery in Bosto... | en |
1772 rows × 5 columns
The created_at variable is a date-time (datetime64) object, specifying date and time in the UTC time zone:
dat["created_at"]
0 2022-03-10 21:59:58+00:00 1 2022-03-10 22:00:03+00:00 2 2022-03-10 22:00:06+00:00 ... 1769 2022-03-11 21:59:20+00:00 1770 2022-03-11 21:59:20+00:00 1771 2022-03-11 21:59:25+00:00 Name: created_at, Length: 1772, dtype: datetime64[ns, UTC]
It is more convenient to work with local times rather than UTC. Boston is in the US/Eastern time zone:
dat["created_at"] = dat["created_at"].dt.tz_convert("US/Eastern")
dat["created_at"]
0 2022-03-10 16:59:58-05:00 1 2022-03-10 17:00:03-05:00 2 2022-03-10 17:00:06-05:00 ... 1769 2022-03-11 16:59:20-05:00 1770 2022-03-11 16:59:20-05:00 1771 2022-03-11 16:59:25-05:00 Name: created_at, Length: 1772, dtype: datetime64[ns, US/Eastern]
Now we can find out the time frame of the collected tweets:
dat["created_at"].min()
Timestamp('2022-03-10 16:59:58-0500', tz='US/Eastern')
dat["created_at"].max()
Timestamp('2022-03-11 16:59:25-0500', tz='US/Eastern')
dat["created_at"].max() - dat["created_at"].min()
Timedelta('0 days 23:59:27')
We will remove tweets from the first (incomplete) hour:
sel = dat["created_at"] > pd.to_datetime("2022-03-10 17:00:00-05:00")
dat = dat[sel].reset_index()
dat
index | created_at | user | coordinates | text | lang | |
---|---|---|---|---|---|---|
0 | 1 | 2022-03-10 17:00:03-05:00 | {'id': 2202066812, 'id_str': '2... | {'type': 'Point', 'coordinates'... | It's 5 o'clock in Marblehead. | en |
1 | 2 | 2022-03-10 17:00:06-05:00 | {'id': 217362857, 'id_str': '21... | {'type': 'Point', 'coordinates'... | Wind 0 mph -. Barometer 30.10 i... | en |
2 | 3 | 2022-03-10 17:00:07-05:00 | {'id': 21799895, 'id_str': '217... | {'type': 'Point', 'coordinates'... | See our latest Hingham, MA Fusi... | en |
... | ... | ... | ... | ... | ... | ... |
1768 | 1769 | 2022-03-11 16:59:20-05:00 | {'id': 107912849, 'id_str': '10... | {'type': 'Point', 'coordinates'... | See our latest #Raynham, MA Pha... | en |
1769 | 1770 | 2022-03-11 16:59:20-05:00 | {'id': 114312080, 'id_str': '11... | {'type': 'Point', 'coordinates'... | Help pave the path to equitable... | en |
1770 | 1771 | 2022-03-11 16:59:25-05:00 | {'id': 294758966, 'id_str': '29... | {'type': 'Point', 'coordinates'... | I'm at Harpoon Brewery in Bosto... | en |
1771 rows × 6 columns
Let us now look into the coordinates column:
dat["coordinates"]
0 {'type': 'Point', 'coordinates'... 1 {'type': 'Point', 'coordinates'... 2 {'type': 'Point', 'coordinates'... ... 1768 {'type': 'Point', 'coordinates'... 1769 {'type': 'Point', 'coordinates'... 1770 {'type': 'Point', 'coordinates'... Name: coordinates, Length: 1771, dtype: object
Each element in the column is a dict, following the GeoJSON format:
x = dat["coordinates"].iloc[0]
x
{'type': 'Point', 'coordinates': [-70.85783, 42.5001]}
type(x)
dict
We can translate it to a "Point" geometry object using function shape from the shapely.geometry package:
shapely.geometry.shape(x)
Using this principle, we can convert the entire column into a geometry column, using package geopandas:
geom = gpd.GeoSeries([shapely.geometry.shape(i) for i in dat["coordinates"]], crs=4326)
geom
0 POINT (-70.85783 42.50010) 1 POINT (-78.57028 43.05667) 2 POINT (-70.88977 42.24177) ... 1768 POINT (-71.05573 41.90565) 1769 POINT (-71.47789 41.99340) 1770 POINT (-71.03487 42.34709) Length: 1771, dtype: geometry
and combine it with dat to create a layer named pnt with both the geometries and tweet attributes:
pnt = gpd.GeoDataFrame(dat, geometry=geom, crs=4326)
pnt = pnt.drop(["coordinates"], axis=1)
pnt
index | created_at | user | text | lang | geometry | |
---|---|---|---|---|---|---|
0 | 1 | 2022-03-10 17:00:03-05:00 | {'id': 2202066812, 'id_str': '2... | It's 5 o'clock in Marblehead. | en | POINT (-70.85783 42.50010) |
1 | 2 | 2022-03-10 17:00:06-05:00 | {'id': 217362857, 'id_str': '21... | Wind 0 mph -. Barometer 30.10 i... | en | POINT (-78.57028 43.05667) |
2 | 3 | 2022-03-10 17:00:07-05:00 | {'id': 21799895, 'id_str': '217... | See our latest Hingham, MA Fusi... | en | POINT (-70.88977 42.24177) |
... | ... | ... | ... | ... | ... | ... |
1768 | 1769 | 2022-03-11 16:59:20-05:00 | {'id': 107912849, 'id_str': '10... | See our latest #Raynham, MA Pha... | en | POINT (-71.05573 41.90565) |
1769 | 1770 | 2022-03-11 16:59:20-05:00 | {'id': 114312080, 'id_str': '11... | Help pave the path to equitable... | en | POINT (-71.47789 41.99340) |
1770 | 1771 | 2022-03-11 16:59:25-05:00 | {'id': 294758966, 'id_str': '29... | I'm at Harpoon Brewery in Bosto... | en | POINT (-71.03487 42.34709) |
1771 rows × 6 columns
The resulting layer pnt can be plotted to see the spatial pattern of tweet locations:
pnt.plot();
The bounding box which was used to collect the tweets can also be converted to a geometry:
bb = shapely.geometry.box(-72.21437, 41.19034, -69.64939, 43.30924)
bb
Here is a plot of the bounding box and tweet locations. We can see that the Twitter API returned many tweets that are outside of the requested bounding box:
base = pnt.plot()
gpd.GeoSeries(bb).plot(ax=base, color="None", edgecolor="black");
We will keep just the tweets within the bounding box, using the .intersects method:
pnt = pnt[pnt.intersects(bb)].copy()
pnt
index | created_at | user | text | lang | geometry | |
---|---|---|---|---|---|---|
0 | 1 | 2022-03-10 17:00:03-05:00 | {'id': 2202066812, 'id_str': '2... | It's 5 o'clock in Marblehead. | en | POINT (-70.85783 42.50010) |
2 | 3 | 2022-03-10 17:00:07-05:00 | {'id': 21799895, 'id_str': '217... | See our latest Hingham, MA Fusi... | en | POINT (-70.88977 42.24177) |
3 | 4 | 2022-03-10 17:00:09-05:00 | {'id': 111986159, 'id_str': '11... | Wind 0 mph WNW. Barometer 30.07... | en | POINT (-71.50139 42.36917) |
... | ... | ... | ... | ... | ... | ... |
1768 | 1769 | 2022-03-11 16:59:20-05:00 | {'id': 107912849, 'id_str': '10... | See our latest #Raynham, MA Pha... | en | POINT (-71.05573 41.90565) |
1769 | 1770 | 2022-03-11 16:59:20-05:00 | {'id': 114312080, 'id_str': '11... | Help pave the path to equitable... | en | POINT (-71.47789 41.99340) |
1770 | 1771 | 2022-03-11 16:59:25-05:00 | {'id': 294758966, 'id_str': '29... | I'm at Harpoon Brewery in Bosto... | en | POINT (-71.03487 42.34709) |
1125 rows × 6 columns
We are left with only those tweets that fall inside the bounding box (the Boston area):
base = pnt.plot()
gpd.GeoSeries(bb).plot(ax=base, color="None", edgecolor="black");
We will find out which county each tweet falls in, using a county borders layer. First, we read the layer from a Shapefile:
borders = gpd.read_file("data/borders.shp")
The following expressions visualize the three spatial layers we now have:
- borders — The county borders
- bb — The bounding box
- pnt — Geo-referenced tweets

base = pnt.plot()
borders.plot(ax=base, color="None", edgecolor="lightgrey")
gpd.GeoSeries(bb).plot(ax=base, color="None", edgecolor="black");
The simplest temporal aggregation is omitting some of the time components, then counting occurrences. For example, calculating a date+hour variable:
pnt["hour"] = pnt["created_at"].dt.strftime("%m-%d %H")
pnt["hour"]
0 03-10 17 2 03-10 17 3 03-10 17 ... 1768 03-11 16 1769 03-11 16 1770 03-11 16 Name: hour, Length: 1125, dtype: object
Then, counting occurrences:
pnt["hour"].value_counts().sort_index().plot.bar();
For spatio-temporal aggregation, we count the occurrences in each unique combination of time and location. For example, we can do a spatial join between the tweets layer and the counties layer:
pnt = gpd.sjoin(pnt, borders)
pnt
index | created_at | user | text | ... | index_right | NAME_0 | NAME_1 | NAME_2 | |
---|---|---|---|---|---|---|---|---|---|
0 | 1 | 2022-03-10 17:00:03-05:00 | {'id': 2202066812, 'id_str': '2... | It's 5 o'clock in Marblehead. | ... | 7 | United States | Massachusetts | Essex |
18 | 19 | 2022-03-10 17:03:37-05:00 | {'id': 65386810, 'id_str': '653... | Spring is in the air. 🌼 🌸 🌻 🌹 @... | ... | 7 | United States | Massachusetts | Essex |
59 | 60 | 2022-03-10 17:25:41-05:00 | {'id': 188856838, 'id_str': '18... | Want to land a job like "Delive... | ... | 7 | United States | Massachusetts | Essex |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
1386 | 1387 | 2022-03-11 14:07:33-05:00 | {'id': 61220731, 'id_str': '612... | 19:07 WC1N (Robert) on W1/HA-00... | ... | 17 | United States | New Hampshire | Cheshire |
1389 | 1390 | 2022-03-11 14:09:32-05:00 | {'id': 61220731, 'id_str': '612... | 19:09 WC1N (Robert) on W1/HA-00... | ... | 17 | United States | New Hampshire | Cheshire |
1401 | 1402 | 2022-03-11 14:15:28-05:00 | {'id': 61220731, 'id_str': '612... | 19:15 WC1N (Robert) on W1/HA-00... | ... | 17 | United States | New Hampshire | Cheshire |
1120 rows × 11 columns
The result is a table with date+hour / county name per tweet:
pnt[["hour", "NAME_2"]]
hour | NAME_2 | |
---|---|---|
0 | 03-10 17 | Essex |
18 | 03-10 17 | Essex |
59 | 03-10 17 | Essex |
... | ... | ... |
1386 | 03-11 14 | Cheshire |
1389 | 03-11 14 | Cheshire |
1401 | 03-11 14 | Cheshire |
1120 rows × 2 columns
Finally, we count occurrences of each date+hour / county combination:
tab = pd.crosstab(pnt["NAME_2"], pnt["hour"])
tab
hour | 03-10 17 | 03-10 18 | 03-10 19 | 03-10 20 | ... | 03-11 13 | 03-11 14 | 03-11 15 | 03-11 16 |
---|---|---|---|---|---|---|---|---|---|
NAME_2 | |||||||||
Barnstable | 1 | 0 | 0 | 0 | ... | 0 | 0 | 1 | 1 |
Bristol | 1 | 4 | 2 | 5 | ... | 2 | 3 | 3 | 2 |
Cheshire | 0 | 0 | 0 | 0 | ... | 2 | 4 | 0 | 0 |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
Windham | 0 | 0 | 0 | 0 | ... | 1 | 0 | 2 | 0 |
Worcester | 4 | 1 | 4 | 1 | ... | 10 | 5 | 2 | 8 |
York | 0 | 0 | 0 | 0 | ... | 2 | 0 | 1 | 1 |
22 rows × 24 columns
The table can be displayed as a heatmap using the sns.heatmap function:
sns.heatmap(tab, annot=True);
Chronologically ordered observations per user represent their path in space. To create the line layer of paths, we first need to extract the user name from the user column, which is a dict:
pnt["user"].iloc[0]
{'id': 2202066812, 'id_str': '2202066812', 'name': "5 O'Clock Somewhere", 'screen_name': '5oclockbot', 'location': None, 'url': None, 'description': "Follow us to know when it's time for a drink. @bugloaf made me.", 'translator_type': 'none', 'protected': False, 'verified': False, 'followers_count': 1929, 'friends_count': 1, 'listed_count': 73, 'favourites_count': 0, 'statuses_count': 74596, 'created_at': 'Mon Nov 18 22:17:15 +0000 2013', 'utc_offset': None, 'time_zone': None, 'geo_enabled': True, 'lang': None, 'contributors_enabled': False, 'is_translator': False, 'profile_background_color': 'C0DEED', 'profile_background_image_url': 'http://abs.twimg.com/images/themes/theme1/bg.png', 'profile_background_image_url_https': 'https://abs.twimg.com/images/themes/theme1/bg.png', 'profile_background_tile': False, 'profile_link_color': '1DA1F2', 'profile_sidebar_border_color': 'C0DEED', 'profile_sidebar_fill_color': 'DDEEF6', 'profile_text_color': '333333', 'profile_use_background_image': True, 'profile_image_url': 'http://pbs.twimg.com/profile_images/378800000758913040/36090d99f2f5c78d26677c0bcb990b18_normal.jpeg', 'profile_image_url_https': 'https://pbs.twimg.com/profile_images/378800000758913040/36090d99f2f5c78d26677c0bcb990b18_normal.jpeg', 'default_profile': True, 'default_profile_image': False, 'following': None, 'follow_request_sent': None, 'notifications': None, 'withheld_in_countries': []}
pnt["user"] = [i["screen_name"] for i in pnt["user"]]
pnt
index | created_at | user | text | ... | index_right | NAME_0 | NAME_1 | NAME_2 | |
---|---|---|---|---|---|---|---|---|---|
0 | 1 | 2022-03-10 17:00:03-05:00 | 5oclockbot | It's 5 o'clock in Marblehead. | ... | 7 | United States | Massachusetts | Essex |
18 | 19 | 2022-03-10 17:03:37-05:00 | MO_DAVINCI | Spring is in the air. 🌼 🌸 🌻 🌹 @... | ... | 7 | United States | Massachusetts | Essex |
59 | 60 | 2022-03-10 17:25:41-05:00 | tmj_BOS_schn | Want to land a job like "Delive... | ... | 7 | United States | Massachusetts | Essex |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
1386 | 1387 | 2022-03-11 14:07:33-05:00 | SOTAwatch | 19:07 WC1N (Robert) on W1/HA-00... | ... | 17 | United States | New Hampshire | Cheshire |
1389 | 1390 | 2022-03-11 14:09:32-05:00 | SOTAwatch | 19:09 WC1N (Robert) on W1/HA-00... | ... | 17 | United States | New Hampshire | Cheshire |
1401 | 1402 | 2022-03-11 14:15:28-05:00 | SOTAwatch | 19:15 WC1N (Robert) on W1/HA-00... | ... | 17 | United States | New Hampshire | Cheshire |
1120 rows × 11 columns
Then, we need to aggregate the point layer by user, collecting all points into a list
. Importantly, the table needs to be sorted in chronological order (which we did earlier):
routes = pnt.groupby(["user"]).agg({"geometry": lambda x: x.tolist()}).reset_index()
routes
user | geometry | |
---|---|---|
0 | 2communique | [POINT (-71.52953383000001 42.3... |
1 | 511NY | [POINT (-71.894361 41.718893), ... |
2 | 5oclockbot | [POINT (-70.85783000000001 42.5... |
... | ... | ... |
487 | yaratrv | [POINT (-71.0565 42.3577)] |
488 | yokomiwa | [POINT (-71.08696908 42.34674)] |
489 | zumescoffee | [POINT (-71.06542 42.3766)] |
490 rows × 2 columns
Keep in mind that most content is created by a few dominant users. For example, here we calculate the number of points n (i.e., tweets) per unique user:
routes["n"] = [len(i) for i in routes["geometry"]]
routes
user | geometry | n | |
---|---|---|---|
0 | 2communique | [POINT (-71.52953383000001 42.3... | 1 |
1 | 511NY | [POINT (-71.894361 41.718893), ... | 2 |
2 | 5oclockbot | [POINT (-70.85783000000001 42.5... | 1 |
... | ... | ... | ... |
487 | yaratrv | [POINT (-71.0565 42.3577)] | 1 |
488 | yokomiwa | [POINT (-71.08696908 42.34674)] | 1 |
489 | zumescoffee | [POINT (-71.06542 42.3766)] | 1 |
490 rows × 3 columns
routes["n"].value_counts().plot(kind="bar");
At least two points are required to form a line, so we filter out users who have just one tweet:
routes = routes[routes["n"] > 1].reset_index(drop=True)
routes
user | geometry | n | |
---|---|---|---|
0 | 511NY | [POINT (-71.894361 41.718893), ... | 2 |
1 | ACutAboveHair | [POINT (-72.1469 41.3497), POIN... | 2 |
2 | Aescano | [POINT (-71.062258 42.325208), ... | 3 |
... | ... | ... | ... |
171 | tmj_usa_prod | [POINT (-71.4778902 41.9933953)... | 2 |
172 | true2theyanks | [POINT (-71.0565 42.3577), POIN... | 2 |
173 | yankh8tr | [POINT (-72.0166321 42.139492),... | 2 |
174 rows × 3 columns
Then, we "connect" the points into "LineString" geometries:
routes["geometry"] = gpd.GeoSeries([shapely.geometry.LineString(i) for i in routes["geometry"]])
routes = gpd.GeoDataFrame(routes, crs=4326)
routes
user | geometry | n | |
---|---|---|---|
0 | 511NY | LINESTRING (-71.89436 41.71889,... | 2 |
1 | ACutAboveHair | LINESTRING (-72.14690 41.34970,... | 2 |
2 | Aescano | LINESTRING (-71.06226 42.32521,... | 3 |
... | ... | ... | ... |
171 | tmj_usa_prod | LINESTRING (-71.47789 41.99340,... | 2 |
172 | true2theyanks | LINESTRING (-71.05650 42.35770,... | 2 |
173 | yankh8tr | LINESTRING (-72.01663 42.13949,... | 2 |
174 rows × 3 columns
Here is a plot of the resulting paths layer:
base = routes.plot()
borders.plot(ax=base, color="None", edgecolor="lightgrey")
gpd.GeoSeries(bb).plot(ax=base, color="None", edgecolor="black");
Running a Python script to construct a Twitter social network:

- Starting from a given user s, travelling until the entire network is covered up to a given depth d (a rough sketch of this traversal is shown below)
- Using the tweepy library to access the Twitter API

python get_followers.py -s MichaelDorman84 -d 2
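The get_followers.py script itself is not shown here. As an illustration only, the depth-limited traversal it performs could be sketched as follows, where get_friends is a hypothetical helper standing in for a tweepy API call that returns the accounts a given user follows:

# Illustrative sketch only (not the original get_followers.py).
# get_friends(user) is a hypothetical helper wrapping a tweepy call that
# returns the screen names a given user follows.
def crawl(start, depth, get_friends):
    edges = []               # (follower, friend) pairs, i.e., the edge list
    visited = set()
    frontier = [start]
    for _ in range(depth):   # expand the network up to the given depth
        next_frontier = []
        for user in frontier:
            if user in visited:
                continue
            visited.add(user)
            for friend in get_friends(user):
                edges.append((user, friend))
                next_frontier.append(friend)
        frontier = next_frontier
    return edges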
The resulting folder of user metadata is then processed into a CSV file with another Python script:
python twitter_network.py
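The twitter_network.py script is likewise not shown. A minimal sketch of its final step, writing the crawled (follower, friend) pairs as a tab-separated edge list like the one read below, might look like this (the example pairs are placeholders):

# Minimal sketch: write (follower, friend) pairs as a tab-separated file with
# no header, so it can be read back with pd.read_csv(..., sep="\t", header=None).
import csv

edges = [("MichaelDorman84", "ireneros"), ("ireneros", "fdo_becerra")]  # placeholder pairs

with open("data/network.csv", "w", newline="") as f:
    writer = csv.writer(f, delimiter="\t")
    writer.writerows(edges)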
Finally, the processed CSV file can be read into Python with pd.read_csv. The table consists of an edge list:
friends = pd.read_csv("data/network.csv", sep = "\t", header=None, usecols=[0, 1], names=["from", "to"])
friends
from | to | |
---|---|---|
0 | MichaelDorman84 | ireneros |
1 | ireneros | fdo_becerra |
2 | ireneros | KAUST_Vislab |
... | ... | ... |
86855 | therealguypines | guyoseary |
86856 | therealguypines | RyanSeacrest |
86857 | therealguypines | TheEllenShow |
86858 rows × 2 columns
We can remove users for whom we have no friend data. That way, the social network ties between the remaining users are fully described:
sel = friends["to"].isin(friends["from"])
friends = friends[sel].reset_index(drop=True)
friends
from | to | |
---|---|---|
0 | MichaelDorman84 | ireneros |
1 | ireneros | juliasilge |
2 | juliasilge | jtleek |
... | ... | ... |
3832 | NOAAResearch | NOAASatellites |
3833 | NOAAResearch | USGS |
3834 | NOAAResearch | NOAA |
3835 rows × 2 columns
The Python script also produces user details, including the self-reported location:
locations = pd.read_csv("data/locations.csv")
locations
user | address | |
---|---|---|
0 | d3visualization | Montreal |
1 | sckottie | OR |
2 | mdsumner | Hobart, Tasmania |
... | ... | ... |
188 | clavitolo | Reading, United Kingdom |
189 | noamross | Brooklyn/Hudson Yards, NY |
190 | locweb | Perth, Western Australia |
191 rows × 2 columns
We can use a geocoding service to convert location text to coordinates. The following expression uses the free Nominatim geocoding service, based on OpenStreetMap data, accessed through geopandas:
# gcp = gpd.tools.geocode(locations["address"], provider="nominatim", user_agent="michael", timeout=4)
# gcp["address"] = locations["address"]
# gcp = gcp.drop_duplicates()
# gcp.to_file("data/gcp.shp")
gcp = gpd.read_file("data/gcp.shp")
gcp
address | geometry | |
---|---|---|
0 | Montreal | POINT (-73.56981 45.50318) |
1 | OR | POINT (-120.73726 43.97928) |
2 | Hobart, Tasmania | POINT (147.32812 -42.88251) |
... | ... | ... |
146 | Reading, United Kingdom | POINT (-0.96965 51.45666) |
147 | Brooklyn/Hudson Yards, NY | POINT (-73.99645 40.75608) |
148 | Perth, Western Australia | POINT (115.86058 -31.95590) |
149 rows × 2 columns
To get the country name for each user location, we can use the world borders polygonal layer available as a built-in dataset in geopandas:
world = gpd.read_file(gpd.datasets.get_path("naturalearth_lowres"))
world = world[["name", "geometry"]]
world.plot();
Here is a map of:
- world — World countries
- world.intersects(gcp.unary_union) — World countries coinciding with Twitter user locations
- gcp — Geocoded Twitter user locations

base = world.plot(color="None", edgecolor="grey")
world[world.intersects(gcp.unary_union)].plot(ax=base, color="grey", edgecolor="black")
gcp.plot(ax=base, color="red");
We can now add, for each user, the country their location falls in. First, we use a spatial join to detect the country name in which each geocoded address falls:
gcp = gpd.sjoin(gcp, world, how="left")
gcp
address | geometry | index_right | name | |
---|---|---|---|---|
0 | Montreal | POINT (-73.56981 45.50318) | 3.0 | Canada |
1 | OR | POINT (-120.73726 43.97928) | 4.0 | United States of America |
2 | Hobart, Tasmania | POINT (147.32812 -42.88251) | 137.0 | Australia |
... | ... | ... | ... | ... |
146 | Reading, United Kingdom | POINT (-0.96965 51.45666) | 143.0 | United Kingdom |
147 | Brooklyn/Hudson Yards, NY | POINT (-73.99645 40.75608) | 4.0 | United States of America |
148 | Perth, Western Australia | POINT (115.86058 -31.95590) | 137.0 | Australia |
149 rows × 4 columns
Then, we use an ordinary join to attach those country names back to the Twitter users list. That way, in the locations table, we now have user+country instead of user+address:
locations = pd.merge(locations, gcp[["address", "name"]], how="left").drop(["address"], axis=1)
locations
user | name | |
---|---|---|
0 | d3visualization | Canada |
1 | sckottie | United States of America |
2 | mdsumner | Australia |
... | ... | ... |
188 | clavitolo | United Kingdom |
189 | noamross | United States of America |
190 | locweb | Australia |
191 rows × 2 columns
Now we can replace all user names in the "edge list" table with the corresponding country names:
friends = friends.rename(columns={"from":"user"}).merge(locations, how="inner").rename(columns={"name":"from"}).drop(["user"], axis=1)
friends = friends.rename(columns={"to":"user"}).merge(locations, how="inner").rename(columns={"name":"to"}).drop(["user"], axis=1)
friends
from | to | |
---|---|---|
0 | Israel | United States of America |
1 | United States of America | United States of America |
2 | United Kingdom | United States of America |
... | ... | ... |
3832 | United States of America | Israel |
3833 | Israel | Israel |
3834 | United States of America | Israel |
3835 rows × 2 columns
Then, remove missing values:
friends = friends.dropna().copy()
friends
from | to | |
---|---|---|
0 | Israel | United States of America |
1 | United States of America | United States of America |
2 | United Kingdom | United States of America |
... | ... | ... |
3832 | United States of America | Israel |
3833 | Israel | Israel |
3834 | United States of America | Israel |
2835 rows × 2 columns
and count:
friends["count"] = 1
friends = friends.groupby(["from", "to"]).sum().reset_index()
friends
from | to | count | |
---|---|---|---|
0 | Australia | Australia | 8 |
1 | Australia | Austria | 5 |
2 | Australia | Belgium | 1 |
... | ... | ... | ... |
261 | Venezuela | Tanzania | 1 |
262 | Venezuela | Ukraine | 1 |
263 | Venezuela | United States of America | 8 |
264 rows × 3 columns
The result is a country-to-country edge list.
To benefit from methods for visualization and analysis of networks, we need to convert the edge list table to a network object. We use function from_pandas_edgelist from package networkx:
G = nx.from_pandas_edgelist(friends, "from", "to", create_using=nx.DiGraph(), edge_attr="count")
G
<networkx.classes.digraph.DiGraph at 0x7fac4ab9c700>
A network object basically contains two components: nodes and edges. In our case, the nodes are countries:
list(G.nodes)
['Australia', 'Austria', 'Belgium', 'Canada', 'Denmark', 'France', 'Germany', 'Ireland', 'Italy', 'Netherlands', 'New Zealand', 'Romania', 'Spain', 'Switzerland', 'Tanzania', 'Ukraine', 'United Kingdom', 'United States of America', 'Finland', 'Japan', 'Venezuela', 'India', 'Thailand', 'Israel', 'China']
len(list(G.nodes))
25
and the edges are follower ties between users of those countries, weighted according to the number of ties ("count"):
list(G.edges.data())[:10]
[('Australia', 'Australia', {'count': 8}), ('Australia', 'Austria', {'count': 5}), ('Australia', 'Belgium', {'count': 1}), ('Australia', 'Canada', {'count': 6}), ('Australia', 'Denmark', {'count': 1}), ('Australia', 'France', {'count': 5}), ('Australia', 'Germany', {'count': 6}), ('Australia', 'Ireland', {'count': 1}), ('Australia', 'Italy', {'count': 1}), ('Australia', 'Netherlands', {'count': 4})]
len(list(G.edges))
264
The network can be visualized using function nx.draw. We are using one of the built-in layout algorithms (nx.kamada_kawai_layout) to calculate an optimal visual arrangement of the nodes:
pos = nx.kamada_kawai_layout(G)
nx.draw(G, pos, with_labels=True)
To reflect the edge weights, we can use the width parameter of a network plot:
weights = nx.get_edge_attributes(G,"count").values()
weights = list(weights)
weights[:10]
[8, 5, 1, 6, 1, 5, 6, 1, 1, 4]
pos = nx.kamada_kawai_layout(G)
nx.draw(G, pos, with_labels=True, width=[i/50 for i in weights])
Let us calculate two basic graph properties, density and the number of connected components:
nx.density(G)
0.44
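For a directed graph, networkx defines density as the number of edges divided by the number of possible ordered node pairs, n*(n-1). We can reproduce the value from the node and edge counts seen above:

n = len(G.nodes)    # 25 countries
m = len(G.edges)    # 264 country-to-country ties
m / (n * (n - 1))   # 264 / 600 = 0.44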
nx.number_connected_components(G.to_undirected())
1
Since G is a spatial network (where vertices represent locations), it may be more natural to display it in a spatial layout. To do that, we first have to attach x/y coordinates to each vertex. We use the country centroids. Here is how we can get the centroid coordinates of one specific country:
i = list(G.nodes)[0]
i
'Australia'
list(world[world["name"] == i]["geometry"].iloc[0].centroid.coords)
[(134.50277547536595, -25.730654779726077)]
and here is how we get all coordinates at once, into a dict named pos:
pos = [list(world[world["name"] == i]["geometry"].iloc[0].centroid.coords)[0] for i in list(G.nodes)]
pos = dict(zip(list(G.nodes), pos))
pos
{'Australia': (134.50277547536595, -25.730654779726077), 'Austria': (14.076158884337072, 47.6139487927463), 'Belgium': (4.580834113854935, 50.65244095902296), 'Canada': (-98.14238137209708, 61.46907614534896), 'Denmark': (9.876372937675002, 56.06393446179454), 'France': (-2.8766966992706267, 42.46070432663372), 'Germany': (10.288485092742851, 51.13372269040778), 'Ireland': (-8.010236544877012, 53.18059120995006), 'Italy': (12.140788372235871, 42.751183052964265), 'Netherlands': (5.512217100965399, 52.298700374441786), 'New Zealand': (172.70192594405574, -41.662578757158684), 'Romania': (24.943252494635377, 45.857101035738005), 'Spain': (-3.6170206023873743, 40.348656106226734), 'Switzerland': (8.118300613385486, 46.79173768366762), 'Tanzania': (34.75298985475595, -6.257732428506092), 'Ukraine': (31.229122070266495, 49.14882260840351), 'United Kingdom': (-2.8531353951805545, 53.91477348053706), 'United States of America': (-112.5994359115045, 45.70562800215178), 'Finland': (26.211764610296353, 64.50409403963651), 'Japan': (138.06496213270776, 37.66311081170466), 'Venezuela': (-66.16382727830238, 7.162132267639002), 'India': (79.59370376325381, 22.92500640740852), 'Thailand': (101.00613354626108, 15.01697499141648), 'Israel': (35.003851206429005, 31.4849193900197), 'China': (103.88361230063249, 36.555066531858685)}
which can be passed to nx.draw:
base = world.plot(color="None", edgecolor="lightgrey")
nx.draw(G, pos, ax=base, with_labels=True, width=[i/50 for i in weights])
Node degree is the number of edges adjacent to the node, or, in a weighted network, the sum of the edge weights for that node:
d = G.degree(weight="count")
d
DiDegreeView({'Australia': 180, 'Austria': 104, 'Belgium': 27, 'Canada': 294, 'Denmark': 83, 'France': 266, 'Germany': 237, 'Ireland': 39, 'Italy': 28, 'Netherlands': 125, 'New Zealand': 55, 'Romania': 26, 'Spain': 99, 'Switzerland': 52, 'Tanzania': 38, 'Ukraine': 28, 'United Kingdom': 796, 'United States of America': 2864, 'Finland': 29, 'Japan': 6, 'Venezuela': 42, 'India': 14, 'Thailand': 16, 'Israel': 221, 'China': 1})
sizes = list(dict(d).values())
base = world.plot(color="None", edgecolor="lightgrey")
nx.draw(G, pos, ax=base, with_labels=True, width=[i/50 for i in weights], node_size=sizes)
Community detection algorithms aim at identifying sub-groups in a network. A sub-group is a set of nodes that has a relatively large number of internal ties, and also relatively few ties from the group to other parts of the network.
list(networkx.algorithms.community.greedy_modularity_communities(G))
[frozenset({'Australia', 'Canada', 'Denmark', 'France', 'Germany', 'Ireland', 'New Zealand', 'Spain', 'Switzerland', 'United Kingdom'}), frozenset({'China', 'Finland', 'India', 'Israel', 'Thailand', 'Ukraine', 'United States of America', 'Venezuela'}), frozenset({'Austria', 'Belgium', 'Italy', 'Japan', 'Netherlands', 'Romania', 'Tanzania'})]
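To see where those communities sit geographically, one option (not part of the original code) is to color the nodes by community in the spatial layout from above, reusing pos and weights:

# Color each country node by its detected community (illustrative addition)
communities = list(networkx.algorithms.community.greedy_modularity_communities(G))
node_color = [next(i for i, c in enumerate(communities) if node in c) for node in G.nodes]

base = world.plot(color="None", edgecolor="lightgrey")
nx.draw(G, pos, ax=base, with_labels=True, width=[i/50 for i in weights],
        node_color=node_color, cmap=plt.cm.Set1)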
Sentiment analysis of the tweet texts can be done using package textblob, which assigns each text a polarity score between -1 (most negative) and 1 (most positive). For example:

text = [
"I'm happy",
"I'm sad...",
"I'm very happy!",
"I'm not happy"
]
[(i, textblob.TextBlob(i).sentiment.polarity) for i in text]
[("I'm happy", 0.8), ("I'm sad...", -0.5), ("I'm very happy!", 1.0), ("I'm not happy", -0.4)]
Before calculating the polarity of the sampled tweets, we need to keep only those in English:
pnt1 = pnt[pnt["lang"] == "en"].copy()
pnt1
index | created_at | user | text | ... | index_right | NAME_0 | NAME_1 | NAME_2 | |
---|---|---|---|---|---|---|---|---|---|
0 | 1 | 2022-03-10 17:00:03-05:00 | 5oclockbot | It's 5 o'clock in Marblehead. | ... | 7 | United States | Massachusetts | Essex |
18 | 19 | 2022-03-10 17:03:37-05:00 | MO_DAVINCI | Spring is in the air. 🌼 🌸 🌻 🌹 @... | ... | 7 | United States | Massachusetts | Essex |
59 | 60 | 2022-03-10 17:25:41-05:00 | tmj_BOS_schn | Want to land a job like "Delive... | ... | 7 | United States | Massachusetts | Essex |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
1672 | 1673 | 2022-03-11 16:19:24-05:00 | SperryCareers | We're hiring! Click to apply: S... | ... | 3 | United States | Maine | York |
1107 | 1108 | 2022-03-11 12:15:28-05:00 | tmj_MA_transp | Want to work at FedEx Express? ... | ... | 11 | United States | Massachusetts | Nantucket |
1386 | 1387 | 2022-03-11 14:07:33-05:00 | SOTAwatch | 19:07 WC1N (Robert) on W1/HA-00... | ... | 17 | United States | New Hampshire | Cheshire |
1094 rows × 11 columns
Then, we can calculate polarity and place it in a new polarity column:
pnt1["polarity"] = [textblob.TextBlob(i).sentiment.polarity for i in pnt1["text"]]
pnt1
index | created_at | user | text | ... | NAME_0 | NAME_1 | NAME_2 | polarity | |
---|---|---|---|---|---|---|---|---|---|
0 | 1 | 2022-03-10 17:00:03-05:00 | 5oclockbot | It's 5 o'clock in Marblehead. | ... | United States | Massachusetts | Essex | 0.00 |
18 | 19 | 2022-03-10 17:03:37-05:00 | MO_DAVINCI | Spring is in the air. 🌼 🌸 🌻 🌹 @... | ... | United States | Massachusetts | Essex | 0.00 |
59 | 60 | 2022-03-10 17:25:41-05:00 | tmj_BOS_schn | Want to land a job like "Delive... | ... | United States | Massachusetts | Essex | 0.00 |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
1672 | 1673 | 2022-03-11 16:19:24-05:00 | SperryCareers | We're hiring! Click to apply: S... | ... | United States | Maine | York | 0.00 |
1107 | 1108 | 2022-03-11 12:15:28-05:00 | tmj_MA_transp | Want to work at FedEx Express? ... | ... | United States | Massachusetts | Nantucket | 0.00 |
1386 | 1387 | 2022-03-11 14:07:33-05:00 | SOTAwatch | 19:07 WC1N (Robert) on W1/HA-00... | ... | United States | New Hampshire | Cheshire | -0.75 |
1094 rows × 12 columns
Here are the five most negative tweets:
pnt1[["text", "polarity"]].sort_values(by="polarity").head()["text"].tolist()
['19:07 WC1N (Robert) on W1/HA-009 (Monadnock Mountain, 967m, 4 pts) 14.0590 CW: [RBNHole] at KM3T 18 WPM 3 dB SNR [RBNHOLE]', 'Tobias Harris has the worst contract in the league. God damn he sucks.', 'Random #bunkerhill timelapse clip of the day! #charlestown #boston @bostonNHP https://t.co/qf3n1NGtW7', 'Random #southie timelapse clip of the day! #boston #dorchesterheights @bostonNHP https://t.co/uxOnUU7QZW', 'Just posted a photo @ Cold Harbor Brewing Company https://t.co/kf7QG5cOsi']
and the five most positive tweets:
pnt1[["text", "polarity"]].sort_values(by="polarity", ascending=False).head()["text"].tolist()
['The great Max Jordan turns 18 today!\nMiraculous! @ Providence, Rhode Island https://t.co/p2DXNrRKDU', 'Career tip for landing jobs like "Sanitation" in #Braintree, MA. Go on informational interviews. The best way to ge… https://t.co/XPqLodsb7B', 'Excellent flavor. - Drinking a Letter To Robert Fripp by @CamBrewingCo at @cambridgebrewer — https://t.co/tR4VtNBBHg', 'At Hawthorn Senior Living we care about people and because our residents deserve the best. If you are someone who u… https://t.co/XUxU1vfI9H', 'Our delicious FIsh Stew tonight. #fishstew #fishfriday #fishandchips #bakedschrod #grilledsalmon #allovernewton… https://t.co/wMDs5Nz2x1']
We can also examine the spatial pattern of tweet polarity using a map:
pnt1.plot(column="polarity", legend=True);
- twarc
- tweepy
- shapely
- geopandas
- networkx
- textblob