{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "initial_id",
   "metadata": {
    "collapsed": true,
    "ExecuteTime": {
     "end_time": "2023-11-07T18:15:48.594817Z",
     "start_time": "2023-11-07T18:15:47.605833Z"
    }
   },
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import folium\n",
    "import utils"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "outputs": [],
   "source": [
    "# Load the four source lists; the CSV paths are relative to the working directory\n",
    "ListA = pd.read_csv('List A.csv')\n",
    "ListB = pd.read_csv('List B.csv')\n",
    "ListC = pd.read_csv('List C.csv')\n",
    "ListD = pd.read_csv('List D.csv')"
   ],
   "metadata": {
    "collapsed": false,
    "ExecuteTime": {
     "end_time": "2023-11-07T18:15:48.604219Z",
     "start_time": "2023-11-07T18:15:48.596141Z"
    }
   },
   "id": "73b780e762c9de37"
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "outputs": [],
   "source": [
    "# Create three centroids, one in the North End, one in the Financial District, and one in the Back Bay\n",
    "# Each centroid is a [latitude, longitude] pair\n",
    "centroids = [[42.364506, -71.054733], [42.358894, -71.056742], [42.3505, -71.0760]]\n",
    "\n",
    "# Northeastern as a 'longitude,latitude' string -- note the order is reversed relative to the centroids\n",
    "northeastern_coordinate = \"-71.09033,42.33976\""
   ],
   "metadata": {
    "collapsed": false,
    "ExecuteTime": {
     "end_time": "2023-11-07T18:15:48.608755Z",
     "start_time": "2023-11-07T18:15:48.604788Z"
    }
   },
   "id": "be4c8c1d77842ef7"
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "outputs": [],
   "source": [
    "# Tag every row with the list it came from, then combine the four lists into one frame\n",
    "ListA['list'] = 'A'\n",
    "ListB['list'] = 'B'\n",
    "ListC['list'] = 'C'\n",
    "ListD['list'] = 'D'\n",
    "\n",
    "# Each list keeps its own row index, so index values repeat across lists in the combined frame\n",
    "TotalList = pd.concat([ListA, ListB, ListC, ListD])"
   ],
   "metadata": {
    "collapsed": false,
    "ExecuteTime": {
     "end_time": "2023-11-07T18:15:48.613233Z",
     "start_time": "2023-11-07T18:15:48.607380Z"
    }
   },
   "id": "ffe4025e97a6c6b9"
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "outputs": [],
   "source": [
    "# Keep only the name, gps and list columns\n",
    "# Take an explicit copy: later cells assign to columns of this frame, which must not be a view of the concat result\n",
    "TotalList = TotalList[['name', 'gps', 'list']].copy()"
   ],
   "metadata": {
    "collapsed": false,
    "ExecuteTime": {
     "end_time": "2023-11-07T18:15:48.613309Z",
     "start_time":
"2023-11-07T18:15:48.611827Z"
    }
   },
   "id": "72657779b4484aae"
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "outputs": [],
   "source": [
    "# Convert the gps column to a list of lists for k-means\n",
    "# Parsing happens in one pass, and values that are already lists are accepted as-is,\n",
    "# so re-running this cell no longer fails with AttributeError on .strip\n",
    "def _parse_gps(value):\n",
    "    \"\"\"Return value as a list of floats; accepts a bracketed, comma-separated string or a sequence of numbers.\"\"\"\n",
    "    if isinstance(value, str):\n",
    "        # Text form: drop the surrounding brackets and split on commas\n",
    "        value = value.strip('[]').split(',')\n",
    "    return [float(part) for part in value]\n",
    "\n",
    "\n",
    "TotalList['gps'] = TotalList['gps'].apply(_parse_gps)"
   ],
   "metadata": {
    "collapsed": false,
    "ExecuteTime": {
     "end_time": "2023-11-07T18:15:48.617922Z",
     "start_time": "2023-11-07T18:15:48.614428Z"
    }
   },
   "id": "a157ffaec020a29a"
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "outputs": [
    {
     "data": {
      "text/plain": " name gps list \\\n0 521 Commercial Street #525 [42.3688272, -71.0553792] A \n1 Acorn St [42.3576234, -71.0688746] A \n2 Arlington's Great Meadows [42.4299758, -71.2038948] A \n3 Arthur Fiedler Statue [42.3565057, -71.0754527] A \n4 BU Beach [42.3511927, -71.1060828] A \n.. ... ... ... \n33 The Quiet Few [42.3670906, -71.0359889] D \n34 The Tall Ship Boston [42.3649544, -71.0414523] D \n35 Toasted Flats [42.3711266, -71.0371343] D \n36 Vega Market [42.3891835, -71.033703] D \n37 Winthrop High School [42.3803348, -70.9799864] D \n\n normalized_gps \n0 [0.7251058917247415, 0.7797482353989729] \n1 [0.6747391031099019, 0.7451825969538083] \n2 [1.0, 0.3993566550776867] \n3 [0.6697144722136962, 0.7283341725828262] \n4 [0.6458298305822171, 0.6498815915448888] \n.. ... \n33 [0.717298990038831, 0.8294124246148072] \n34 [0.7076956827824702, 0.8154190706511427] \n35 [0.7354428661210094, 0.8264787225922622] \n36 [0.8166178304491644, 0.8352672783369615] \n37 [0.7768384161061446, 0.972851090162032] \n\n[169 rows x 4 columns]",
      "text/html": "
| \n | name | \ngps | \nlist | \nnormalized_gps | \n
|---|---|---|---|---|
| 0 | \n521 Commercial Street #525 | \n[42.3688272, -71.0553792] | \nA | \n[0.7251058917247415, 0.7797482353989729] | \n
| 1 | \nAcorn St | \n[42.3576234, -71.0688746] | \nA | \n[0.6747391031099019, 0.7451825969538083] | \n
| 2 | \nArlington's Great Meadows | \n[42.4299758, -71.2038948] | \nA | \n[1.0, 0.3993566550776867] | \n
| 3 | \nArthur Fiedler Statue | \n[42.3565057, -71.0754527] | \nA | \n[0.6697144722136962, 0.7283341725828262] | \n
| 4 | \nBU Beach | \n[42.3511927, -71.1060828] | \nA | \n[0.6458298305822171, 0.6498815915448888] | \n
| ... | \n... | \n... | \n... | \n... | \n
| 33 | \nThe Quiet Few | \n[42.3670906, -71.0359889] | \nD | \n[0.717298990038831, 0.8294124246148072] | \n
| 34 | \nThe Tall Ship Boston | \n[42.3649544, -71.0414523] | \nD | \n[0.7076956827824702, 0.8154190706511427] | \n
| 35 | \nToasted Flats | \n[42.3711266, -71.0371343] | \nD | \n[0.7354428661210094, 0.8264787225922622] | \n
| 36 | \nVega Market | \n[42.3891835, -71.033703] | \nD | \n[0.8166178304491644, 0.8352672783369615] | \n
| 37 | \nWinthrop High School | \n[42.3803348, -70.9799864] | \nD | \n[0.7768384161061446, 0.972851090162032] | \n
169 rows × 4 columns
\n| \n | waypoint_index | \ntrips_index | \nhint | \ndistance | \nname | \nlocation | \nlat | \nlon | \nroute | \n
|---|---|---|---|---|---|---|---|---|---|
| 0 | \n0 | \n0 | \nt4YsgAGHLIAAAAAAVQEAAAAAAAAwAAAAAAAAAHV0F0IAAA... | \n19.432511 | \n\n | [-71.054865, 42.364361] | \n-71.054865 | \n42.364361 | \n1 | \n
| 1 | \n1 | \n0 | \nIzYEgGw1BIASAAAArwAAADMAAACUAwAAynkIQGUkmkEXlL... | \n6.024489 | \n\n | [-71.055569, 42.364032] | \n-71.055569 | \n42.364032 | \n1 | \n
| 2 | \n2 | \n0 | \n5IgsgAqJLID7AAAAHgAAAAwAAAAIAAAAz5ffQcMBVEDFYK... | \n5.871835 | \n\n | [-71.055582, 42.365251] | \n-71.055582 | \n42.365251 | \n1 | \n
| 3 | \n3 | \n0 | \nG4gsgDiILICSAwAA5gAAAOkAAAAAAAAAQljLQnyXy0Fhy8... | \n2.602121 | \n\n | [-71.056164, 42.366918] | \n-71.056164 | \n42.366918 | \n1 | \n
| 4 | \n4 | \n0 | \ngIosgLaKLIDOAAAArgAAAFwBAAAAAAAAp3O3QafxmUEQiR... | \n15.458439 | \n\n | [-71.055561, 42.368861] | \n-71.055561 | \n42.368861 | \n1 | \n
| ... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n
| 151 | \n62 | \n0 | \nlhgDgIkYA4BkAAAAIgEAAFoBAAAaAAAAJyAzQWNrAEI8Ax... | \n7.134933 | \n\n | [-71.083465, 42.34194] | \n-71.083465 | \n42.341940 | \n2 | \n
| 152 | \n63 | \n0 | \nMQwigFwMIoAoAAAANQAAABwAAAB-AAAAoidqQSAYl0GvUh... | \n11.504463 | \n\n | [-71.094327, 42.341231] | \n-71.094327 | \n42.341231 | \n2 | \n
| 153 | \n64 | \n0 | \nbwwigH0MIoAFAAAAEAAAAFUAAAArAAAAag0xP3921D-BFx... | \n8.340476 | \n\n | [-71.095003, 42.342001] | \n-71.095003 | \n42.342001 | \n2 | \n
| 154 | \n65 | \n0 | \nk4chgBiIIYAKAAAAFwAAAPQDAAB_AgAAHn2aP-biHUBi6e... | \n36.240351 | \n\n | [-71.093834, 42.339096] | \n-71.093834 | \n42.339096 | \n2 | \n
| 155 | \n66 | \n0 | \nDoUhgBeFIYCcAAAAJgAAAAAAAAARAAAAm0CKQdkZiEAAAA... | \n0.236958 | \nNortheastern (Inbound) | \n[-71.090331, 42.339762] | \n-71.090331 | \n42.339762 | \n2 | \n
156 rows × 9 columns
\n| \n | waypoint_index | \ntrips_index | \nhint | \ndistance | \nname | \nlocation | \nlat | \nlon | \nroute | \n
|---|---|---|---|---|---|---|---|---|---|
| 0 | \n0 | \n0 | \nt4YsgAGHLIAAAAAAVQEAAAAAAAAwAAAAAAAAAHV0F0IAAA... | \n19.432511 | \n\n | [-71.054865, 42.364361] | \n-71.054865 | \n42.364361 | \n1 | \n
| 1 | \n1 | \n0 | \ne1kugJlZLoBmAAAA6QAAAAAAAAAAAAAAZ6M2QSewzkEAAA... | \n4.756158 | \n\n | [-71.060933, 42.376178] | \n-71.060933 | \n42.376178 | \n1 | \n
| 2 | \n2 | \n0 | \ntFkugHVaLoAOAAAAAAAAABgAAAAAAAAAwMG2QAAAAAB6ii... | \n4.525535 | \n\n | [-71.060753, 42.376391] | \n-71.060753 | \n42.376391 | \n1 | \n
| 3 | \n3 | \n0 | \nsJAugLOQLoBuAQAAlAEAAAAAAAAAAAAAHFcjQvEZM0IAAA... | \n7.844897 | \n\n | [-71.060948, 42.380436] | \n-71.060948 | \n42.380436 | \n1 | \n
| 4 | \n4 | \n0 | \nVREtgNlJBIBCAAAAYAAAAAAAAAARAAAAOOzeQU7vHkIAAA... | \n22.681980 | \nFactory Street | \n[-71.061206, 42.398809] | \n-71.061206 | \n42.398809 | \n1 | \n
| ... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n
| 170 | \n31 | \n0 | \ne38hgIUAA4C6AgAAGQAAAAAAAAAAAAAA_DybQoNdJUEAAA... | \n6.310267 | \nCarmel Street | \n[-71.100092, 42.332401] | \n-71.100092 | \n42.332401 | \n3 | \n
| 171 | \n32 | \n0 | \ng38hgI1_IYBOAAAAfwAAAAAAAAAAAAAAZ4ECQsbEUkIAAA... | \n12.789906 | \nTremont Street | \n[-71.098267, 42.332009] | \n-71.098267 | \n42.332009 | \n3 | \n
| 172 | \n33 | \n0 | \ncX8hgJF_IYA1AAAAMAAAAGcAAABOAAAATyWxQQ77nUEHMC... | \n22.776295 | \nAlleghany Street | \n[-71.099348, 42.33047] | \n-71.099348 | \n42.330470 | \n3 | \n
| 173 | \n34 | \n0 | \ns9QhgLbUIYAwAAAAkAAAAAAAAAAAAAAA2XmpQNgrgEEAAA... | \n4.111715 | \n\n | [-71.09454, 42.325354] | \n-71.094540 | \n42.325354 | \n3 | \n
| 174 | \n35 | \n0 | \nDoUhgBeFIYCcAAAAJgAAAAAAAAARAAAAm0CKQdkZiEAAAA... | \n0.236958 | \nNortheastern (Inbound) | \n[-71.090331, 42.339762] | \n-71.090331 | \n42.339762 | \n3 | \n
175 rows × 9 columns
\n