Tom Beer committed on
Commit
cb242b3
1 Parent(s): 6459725

add data files

Browse files
data.py CHANGED
@@ -38,20 +38,19 @@ hotel_id_to_review_map = get_hotel_id_to_review_map()
38
 
39
  def get_prompt(city, preferences) -> dict:
40
 
41
- score_threshold = score_threshold_per_city[city]
42
  for hotel_id in perm(city_to_hotel_id_map[city]):
43
  hotel_id = str(hotel_id)
44
  res = {"hotel_name": hotel_id_to_name_map[hotel_id], 'positive': [], 'negative': []}
45
- if hotel_id_to_review_map[hotel_id]['average_score'] >= score_threshold:
46
  hotel_reviews = hotel_id_to_review_map[hotel_id]['reviews']
47
- if len(hotel_reviews) > 100:
48
- for review in perm(hotel_reviews):
49
- if review['num_helpful'] > 10:
50
- if (review['score'] == 5) & (len(res['positive']) < 3):
51
- res['positive'].append(review)
52
- if (review['score'] <= 2) & (len(res['negative']) < 1):
53
- res['negative'].append(review)
54
- if (len(res['positive']) >= 3) & (len(res['negative']) >= 1):
55
- break
56
 
57
  return res
 
38
 
39
  def get_prompt(city, preferences) -> dict:
40
 
 
41
  for hotel_id in perm(city_to_hotel_id_map[city]):
42
  hotel_id = str(hotel_id)
43
  res = {"hotel_name": hotel_id_to_name_map[hotel_id], 'positive': [], 'negative': []}
44
+ try:
45
  hotel_reviews = hotel_id_to_review_map[hotel_id]['reviews']
46
+ except KeyError:
47
+ continue
48
+ for review in perm(hotel_reviews):
49
+ if (review['score'] == 5) & (len(res['positive']) < 3):
50
+ res['positive'].append(review)
51
+ if (review['score'] <= 2) & (len(res['negative']) < 1):
52
+ res['negative'].append(review)
53
+ if (len(res['positive']) >= 3) & (len(res['negative']) >= 1):
54
+ break
55
 
56
  return res
data/cmu/processed/cities.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["Boston", "Seattle", "San Jose", "Charlotte", "Chicago", "Washington DC", "Fort Worth", "Jacksonville", "Denver", "Los Angeles", "New York City", "Dallas", "Memphis", "Phoenix", "San Diego", "Austin", "Baltimore", "San Antonio", "Detroit", "Indianapolis", "San Francisco", "Houston", "Columbus", "Philadelphia", "El Paso"]
data/cmu/processed/city_to_hotel_id_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"Boston": [287606, 111418, 94368, 217546, 94363, 94372, 555224, 222957, 549445, 121009, 111441, 320038, 94326, 111422, 89602, 220216, 217550, 216999, 217000, 94354, 89619, 268206, 217148, 120977, 1138709, 222958, 499916, 77629, 89592, 126058, 94350, 89615, 1486034, 77638, 89620, 268205, 111428, 120988, 595373, 89568, 111416, 678412, 111423, 94399, 89599, 225873, 94367, 647006, 111417, 111444, 114150, 89600, 268207, 111434, 620703, 222955, 111421, 89617, 114149, 1201116, 321151, 313573, 1513541, 3225572, 1159285, 234752, 94344, 94371, 1136705, 94330, 114134, 89575, 94337, 89585, 258705], "Seattle": [123037, 123036, 100586, 100597, 72586, 124264, 100587, 100505, 100617, 1101223, 224865, 100554, 126402, 115754, 100570, 100610, 290883, 124269, 216847, 639072, 1147487, 1632900, 1633462, 1630818, 1635174, 1641958, 122985, 1648642, 595041, 122994, 100506, 100584, 100508, 112434, 100600, 3291041, 224860, 253306, 1130160, 224833, 606357, 100513, 224835, 2095177, 243759, 72598, 100531, 123032, 557193, 124270, 122998, 123029, 244041, 100577, 1630840, 100574, 100547, 281526, 100561, 223938, 223217, 124044, 217798, 100537, 100564, 100560, 100538, 123004, 123013, 224843, 578306, 100602, 100619, 217795, 223219, 72579, 258824, 275251, 123003, 268228, 100544, 112437, 124048, 100527, 100567, 100562, 239892, 100540, 123039, 100589, 1724250, 582371, 1174533, 224856, 115755, 281658, 100509, 217807, 123021, 252350, 100581, 72572, 677260, 1755673, 123022, 100585, 1200603, 224783, 112429, 281828, 100504, 614244, 100565, 100542, 1723585, 100569, 112412, 1152288, 613399, 1199588, 100507], "San Jose": [123562, 81703, 276205, 81708, 81710, 81659, 225252, 81662, 253314, 582475, 557214, 81688, 81653, 81691, 1017214, 1022963, 82283, 1645770, 81701, 1158718, 1147011, 1206216, 1142503, 81292, 81647, 81658, 81700, 225266, 1086739, 1528601, 267662, 81625, 239815, 631720, 81677, 119608, 82357, 225261, 119610, 82323, 654166, 82321, 82208, 119606, 119667, 81642, 81667, 81695, 287394, 82156, 223968, 
81699, 81644, 240060, 82299, 81656, 324321, 81679, 225253, 223967, 82169, 81302, 81672, 81705, 226141, 82190, 256800, 225256, 119644, 1887026], "Charlotte": [1176230, 223203, 94166, 100566, 100599, 577342, 100568, 223916, 100637, 100559, 100870, 223210, 121868, 628474, 225335, 1593882, 3263526, 94130, 223374, 121862, 94097, 100607, 100535, 3461669, 94179, 121859, 94093, 100582, 121921, 530678, 94173, 94184, 3452538, 94187, 225334, 94186, 94168, 121861, 225337, 240570, 1905160, 121870, 656554, 100633, 100638, 100612, 121855, 100634, 94108, 100555, 1940779, 141931, 608413, 1156927, 225336, 100516, 325887, 121900, 3376060, 2707911, 94091, 94156, 94109, 275354, 559397, 94152, 1007630, 94127, 115304, 94146, 262983, 1533531, 100606, 100629, 94095, 94140, 94085, 121918, 94132, 258775, 94149, 273191, 309952, 100601, 94202, 1225443, 100631, 100621, 100627, 94158, 121917, 94199, 223211, 94126, 94114, 100556, 94192, 223918, 94103, 94206, 99984, 94100, 100563, 94102, 2723843, 223215, 252496, 94142, 100529, 100546, 1164710, 223917, 223202, 219666, 258771, 239806, 94133, 258879, 100604, 223197, 223198, 223201, 100616, 223204, 100511, 94196, 121909, 94122, 94194, 100636, 239919, 114390, 94171, 94191, 1382115, 94163, 100552, 94205, 631590, 94105, 223196, 100518, 100515, 1016257, 217635, 121910, 223213, 301309, 100524, 655612, 100632, 100613, 121915, 1987298, 223199, 1236686, 94136, 1510383, 1566903, 223195, 1863291, 223214, 100549, 223373, 1855057, 1409115], "Chicago": [841981, 87659, 220240, 90916, 235385, 114581, 111487, 223061, 1045286, 79228, 111509, 114578, 90976, 90955, 87573, 290675, 123293, 1200027, 1743591, 87595, 90922, 87627, 484081, 87576, 278718, 123234, 114583, 142296, 90952, 595763, 1642682, 123306, 123314, 1629781, 3572706, 3529874, 596421, 123290, 1632579, 123217, 123316, 123292, 123216, 123318, 655550, 123278, 123214, 1199683, 123285, 123219, 239958, 225103, 123288, 123289, 123227, 123229, 123301, 123302, 123235, 123236, 3572384, 123209, 123317, 123222, 488493, 
123224, 123232, 774987, 676721, 1164776, 123230, 87600, 278717, 87610, 90918, 87613, 87656, 281340, 123225, 114600, 87566, 1149495, 591177, 299922, 87657, 90973, 90969, 650708, 87614, 87618, 87592, 114608, 273262, 1052716, 123319, 87590, 225108, 250023, 1186401, 1075753, 87635, 90766, 87608, 91042, 217510, 114577, 90986, 87665, 235386, 1477545, 498305, 90957, 90963, 1140049, 111501, 87648, 87617, 87620, 87629, 87602, 87637, 87645, 90762, 114604, 490891, 287568, 87571, 90985, 262831, 87638, 111500, 114595, 2525636, 2648906, 1389502, 87603, 90975, 1742256, 1235890, 87640, 1027237, 247154, 609738, 224036, 286793, 90959, 304277, 674288, 111486, 505788, 293203, 2042562, 87632, 236299, 111490, 619615, 111507, 217498, 87654, 1566945, 111492, 114591, 225105, 674283, 1516481], "Washington DC": [84095, 295751, 84064, 84132, 498950, 84087, 557199, 214097, 574805, 253068, 220075, 84127, 84092, 84082, 225100, 84080, 84051, 120613, 120559, 84060, 308189, 80689, 84083, 223893, 120592, 84078, 223031, 125477, 219444, 676149, 247085, 654218, 1175946, 1147664, 3671817, 84120, 3533199, 1197032, 1528551, 123837, 84076, 84033, 1095352, 1212709, 84026, 1204691, 217083, 84134, 75021, 123974, 84044, 1218625, 84038, 1515599, 84068, 84072, 80708, 84081, 939375, 225099, 120563, 84029, 266091, 120585, 1237013, 217767, 84074, 84137, 84067, 240271, 84052, 1456261, 120614, 84073, 120566, 600107, 84107, 84032, 84069, 84101, 84096, 84113, 84098, 84104, 224337, 1224560, 84039, 84129, 84070, 220047, 84125, 84086, 84062, 84079, 220076, 84100, 84084, 125476, 84066, 223900, 84048, 939976, 223897, 498949, 84041, 2038749, 1026016, 114575, 84058, 84075, 84115, 223032, 240907, 84047, 84122, 217770, 84131, 84109, 84118, 120556, 84090, 84065, 84093, 235513, 84117], "Fort Worth": [223888, 109119, 109211, 1222239, 109088, 109178, 109138, 98839, 224283, 2049085, 627514, 277885, 109111, 73551, 109205, 109130, 109187, 98846, 253357, 1640198, 565804, 3584883, 254242, 225117, 98853, 284866, 109215, 3400722, 109143, 
98836, 547965, 109214, 244413, 98847, 98854, 244412, 73543, 73572, 98850, 109201, 273401, 73560, 122709, 224284, 294848, 226486, 225119, 98841, 109116, 109175, 109093, 570264, 109100, 1027019, 109156, 124453, 1101250, 268223, 225116, 672597, 320560, 241640, 109174, 109104, 225118, 676564, 98856, 543350, 98849, 223889, 224286, 225120, 223890, 2306647, 224285, 676704, 1515540, 109101, 2151620, 1382903, 109228, 109173, 189078, 114952, 109150, 574782, 483873, 1846740, 777199, 1137002, 647565, 1526953, 1852898, 249793, 1465151, 2533205, 1027025], "Jacksonville": [1415635, 659250, 84655, 120135, 553883, 84656, 1165021, 88401, 866480, 120174, 247710, 656530, 816774, 813034, 120159, 120161, 1503358, 261234, 1174688, 88451, 120170, 84650, 295756, 84647, 88425, 88416, 1024967, 84658, 84653, 84644, 84659, 217076, 1026989, 1025998, 88468, 84635, 120158, 120133, 286776, 120137, 120182, 1638519, 120157, 120106, 243711, 88405, 564631, 84664, 120128, 88429, 2296144, 226993, 239840, 120109, 88447, 88449, 84617, 88463, 88419, 555377, 88403, 120167, 656584, 1164991, 84660, 88436, 88444, 120141, 84626, 84637, 294735, 120171, 88456, 120131, 268199, 256866, 88440, 224590, 120124, 88400, 1946045, 84649, 120153, 88423, 120160, 1235779, 1819974, 88465, 1235363, 88410, 120147, 88402, 226846, 1164378, 88395, 88406, 120117, 88398, 84636, 84642, 88408, 252242, 120111, 88460, 1450901, 88417, 84661, 1127473, 1450903, 514468, 88442, 120138, 610906, 120123, 120186, 1176973, 84654, 88458, 223246, 120177, 472259, 1549318, 816772, 653217, 1223992, 1391989, 1566763, 1214730, 1201207, 781648, 1231084], "Denver": [85364, 82960, 85346, 82982, 83057, 82961, 81026, 85353, 223852, 119941, 111562, 83091, 114326, 1238865, 543093, 119998, 120000, 83086, 671614, 589144, 83044, 120087, 83095, 83104, 82992, 82976, 111550, 83061, 119948, 85375, 1634494, 85355, 119961, 119959, 119965, 119917, 119968, 119969, 814337, 1163603, 120035, 120039, 1147584, 1157227, 120051, 119911, 557874, 120085, 120086, 120090, 119950, 
120042, 120006, 120040, 119928, 119981, 119975, 120099, 85343, 119929, 120014, 120003, 85338, 119949, 119939, 120017, 85638, 85330, 83060, 120036, 119914, 119923, 1176784, 85341, 119938, 270508, 85325, 120050, 83038, 85366, 225090, 85344, 119997, 85359, 83072, 225093, 120072, 85357, 81023, 83100, 82984, 83014, 83031, 120083, 83023, 530656, 1751673, 83051, 85332, 1238857, 83070, 1190033, 83081, 120029, 83099, 125845, 673588, 83046, 85372, 258669, 2554988, 218788, 119992, 85368, 578192, 85352, 83097, 1653655, 83020, 596431, 657868, 3369752, 1026992, 573340, 83093, 119993, 2085146, 83088, 120056, 2309623, 1737951, 308759, 578190, 120058, 83040, 878358, 530585, 1149434, 1845691, 1859056], "Los Angeles": [76049, 119382, 77264, 248239, 84505, 84517, 208191, 82491, 119483, 84555, 77888, 76793, 2236331, 77714, 81761, 77798, 223049, 84224, 76790, 272668, 82682, 83988, 223054, 504815, 1457221, 77866, 84529, 235456, 611195, 84320, 576828, 1528649, 84513, 577590, 77740, 549431, 113229, 271600, 1225375, 78679, 235134, 2370300, 313508, 84499, 1931273, 559383, 223050, 119492, 1645834, 282463, 570050, 223044, 256799, 549441, 271595, 84442, 81120, 240156, 939204, 1646145, 1636378, 530506, 271599, 1164770, 2482163, 271598, 1642672, 1643539, 271582, 3574043, 3575088, 1630627, 248554, 1645323, 1635388, 271609, 1646526, 1647578, 1629217, 271608, 1637029, 1641833, 1638991, 1646054, 248071, 3460043, 1628810, 271605, 1631741, 226151, 1630960, 3386634, 1646815, 3349317, 291208, 268678, 251538, 1529200, 77852, 82498, 1223148, 589309, 217240, 613619, 77761, 1186068, 575416, 217256, 119399, 82496, 3438742, 82305, 1591524, 3348276, 535826, 76446, 266004, 81285, 249704, 84202, 1642879, 235430, 271581, 247755, 1640422, 1743425, 1229893, 281769, 77809, 119390, 3364389, 271607, 244432, 817023, 271479, 77717, 271606, 291209, 84480, 271601, 271481, 1488816, 248069, 81763, 2232268, 2505057, 2521962, 634746, 276208, 84441, 119434, 226148, 2202132, 84365, 77753, 77262, 77260, 82304, 225809, 77859, 
249692, 119422, 613137, 77729, 119414, 84483, 275366, 77844, 84434, 239812, 553344, 1752249, 84515, 1007413, 268977, 235133, 252254, 119464, 553345, 570515, 226056, 632541, 240151, 3337599, 82684, 84553, 119454, 2698092, 1488412, 82494, 223051, 76460, 82633, 77829, 78688, 113221, 84286, 1628828, 81768, 84437, 77923, 82689, 77247, 77282, 502971, 77870, 77277, 77237, 650376, 82578, 76325, 1657336, 84428, 223042, 77970, 119388, 657068, 249696, 84253, 240875, 81757, 1528623, 1963681, 223046, 77708, 630945, 82148, 84182, 77274, 2072559, 82656, 119443, 84167, 81765, 656235, 77931, 77874, 77256, 82318, 84422, 77232, 223013, 133994, 76061, 272703, 124956, 82679, 82636, 673130, 78037, 1456409, 82150, 1782807, 77917, 82650, 76442, 77944, 82501, 84453, 76458, 77243, 77787, 507339, 78046, 638765, 621153, 119479, 84522, 78694, 84463, 77700, 82686, 84440, 595476, 224168, 274223, 78682, 77827, 119421, 84561, 81170, 1100791, 1049387, 77270, 76083, 77775, 1563899, 77157, 1439222, 2154898, 249693, 77804, 111751, 223041, 1858565, 84502], "New York City": [113317, 99352, 93589, 217616, 208454, 2643161, 1465162, 93559, 80112, 93396, 1456560, 1641016, 1776857, 1762573, 93338, 224224, 75698, 1646128, 578305, 1940859, 99371, 1583937, 641209, 498869, 1500405, 93543, 93335, 1456411, 93419, 93467, 113309, 1025779, 1791248, 1878946, 99288, 99332, 1563892, 93435, 93337, 1157456, 93358, 1383001, 99382, 1379306, 93464, 624442, 93382, 1963673, 1786395, 93351, 1007724, 93561, 217623, 121987, 617306, 93334, 502407, 2622936, 93390, 93475, 80107, 112053, 1027901, 99321, 1858923, 93565, 93575, 93437, 673077, 93376, 99302, 93625, 247814, 290978, 93517, 93333, 93345, 217629, 1149404, 112066, 235228, 99357, 93526, 99443, 3168954, 234762, 121981, 99766, 93344, 125274, 673080, 246797, 93440, 93401, 93364, 219622, 1448670, 598980, 214197, 3506933, 249780, 122007, 260396, 616887, 121985, 1872507, 234764, 1146076, 1165409, 122011, 217613, 1206876, 93356, 557499, 1147661, 1547031, 284904, 1699664, 1141305, 
1990870, 665814, 1164614, 3533197, 2554351, 3580899, 3613090, 224220, 671821, 224225, 93418, 1529345, 3411847, 3236642, 3529145, 3572583, 252870, 1158761, 1820216, 1177257, 646442, 3344640, 247982, 234766, 234765, 235235, 1146278, 1484261, 1146129, 1203394, 671822, 3572587, 3502291, 673661, 99287, 540545, 1176643, 267183, 580078, 224229, 2027969, 290982, 2109422, 543021, 93380, 651216, 225944, 1201662, 239836, 93384, 774805, 281695, 254281, 93572, 122022, 235236, 530265, 268218, 268217, 1049347, 320562, 3583686, 662519, 99292, 1199940, 1961167, 1161809, 249710, 1207461, 93421, 1170336, 1497765, 1575440, 1199530, 651265, 1155229, 290987, 256738, 1161790, 1161789, 93539, 113343, 93357, 80093, 1217376, 1175436, 249656, 224217, 649058, 142114, 1938661, 1164645, 93470, 267182, 75711, 93520, 3541823, 1146072, 113297, 1497821, 596200, 80081, 223023, 616735, 93438, 80075, 93581, 99447, 217627, 550885, 1048678, 1465008, 208888, 671150, 674743, 93633, 93545, 564851, 643970, 655870, 99307, 93403, 223022, 112062, 122015, 93374, 93339, 93486, 223021, 112019, 217622, 93466, 99774, 93586, 93612, 2151571, 99365, 75688, 93398, 93593, 281697, 93359, 281234, 292140, 99333, 584986, 93452, 93622, 287626, 611947, 1234559, 93555, 208455, 209382, 1128769, 93579, 1214829, 630950, 93489, 93450, 99388, 1181739, 488793, 1217245, 249711, 2096704, 112041, 93607, 93379, 1783324, 99391, 1462005, 112039, 1464151, 126257, 1218720, 518280, 1177864, 93618, 93583, 93571, 1390172, 1486164, 607712, 609602, 99425, 254605, 1477775, 93516, 224223, 80110, 1485603, 1733337, 220243, 575732, 122014, 99387, 1235341, 224226, 194238, 121991, 93383, 121996, 122005, 1308397, 223019, 455186, 1158763, 122004, 1553789, 3235844, 93568, 313862, 262330, 1139717, 1595302, 601762, 112021, 217630, 1601249, 2173604, 93569, 1149402, 225942, 93562, 121998, 251906, 80083, 502408, 93462, 93477, 514488, 99368, 249712, 612263, 1237128, 632551, 620040, 157057, 1060157, 1201072, 93346, 121999, 75737, 1949647, 93430, 93606, 277882, 
675616, 93454, 93431, 112064, 93507, 1806062, 866615, 93445, 217626, 571166, 235238, 620399, 268216, 1371825, 99354, 99281, 2148819, 93610, 93603, 113298, 222959, 281071, 99392, 113311, 1785018, 1186070, 99327, 1845644, 208452, 126260, 2079052, 223024, 292142, 93614, 113300, 93534, 273530, 1158753, 113329, 1218792, 634696, 93624, 2253206, 208453, 93352, 1913413, 93457, 630409, 93585, 93623, 80087, 93566, 93525, 112052, 1485961, 224214, 1746459, 80092, 1028569, 1456416, 1415127, 1888977, 1572980, 1503474, 93340, 99762, 224221, 122020], "Dallas": [109571, 114948, 622920, 98733, 109335, 109367, 1493264, 98606, 109353, 585414, 109345, 98609, 98728, 3432111, 122715, 109456, 659532, 224228, 114942, 98647, 98640, 109427, 109426, 109371, 224240, 109474, 109412, 98719, 111538, 98644, 217721, 109438, 98638, 109487, 124066, 589369, 109062, 98653, 1631539, 260923, 223056, 109407, 109479, 244325, 1994522, 224237, 109352, 98690, 239867, 1633428, 589535, 1201122, 1163788, 1209208, 1637827, 223055, 1635592, 508172, 2012023, 2685183, 1951637, 1628732, 98707, 1210969, 98620, 2501834, 2025808, 122724, 1865638, 1638710, 2508014, 98708, 1629801, 98652, 109379, 224236, 224222, 109309, 109471, 2043022, 98663, 109277, 109455, 98617, 98623, 209356, 98664, 98666, 1175089, 656704, 1147227, 224235, 109075, 1214715, 98657, 98695, 239871, 557588, 98721, 258628, 1474749, 1176822, 98694, 217715, 98713, 217717, 109035, 122721, 98675, 109453, 109454, 223045, 98712, 223632, 1221734, 98704, 656305, 109325, 98628, 109493, 98678, 109399, 98622, 109039, 611182, 73644, 109389, 98627, 109391, 109339, 223887, 217716, 98686, 224241, 98685, 98631, 98730, 109789, 1218038, 223053, 122699, 98683, 652607, 109347, 98717, 98639, 109351, 1235854, 98651, 98641, 1657223, 224218, 224227, 98650, 543081, 601262, 109374, 98679, 109370, 224130, 98634, 109334, 109452, 98731, 259593, 98655, 258626, 1526976, 109336, 600113, 280902, 109231, 98629, 111530, 1845655, 109413, 109468, 98710, 2192761, 98727, 109404, 1113787, 98726, 
2280220, 602600, 122703], "Memphis": [775880, 105275, 645386, 98031, 249713, 223752, 105151, 105236, 223886, 111855, 105190, 672520, 105192, 225338, 1676324, 114850, 105281, 239950, 858538, 105207, 223744, 98045, 1138079, 73880, 146517, 105177, 105265, 105184, 98019, 295791, 105247, 98036, 98077, 105194, 98058, 98034, 122584, 223758, 105256, 125626, 105160, 73886, 122499, 1221737, 239352, 656552, 224184, 239353, 223768, 286985, 122495, 223104, 98037, 98028, 122551, 3250815, 98051, 122525, 122554, 122556, 122510, 1638500, 122533, 122568, 122575, 122494, 98053, 122507, 105198, 98018, 98069, 293232, 98071, 243751, 98048, 122561, 98023, 98056, 224185, 98055, 98075, 122504, 122567, 105222, 98032, 98057, 122543, 1146051, 122502, 122542, 105186, 98050, 275455, 105156, 98020, 1804272, 111860, 816268, 105191, 98073, 223773, 248601, 105272, 223770, 105241, 576374, 1485414, 122583, 98070, 105188, 220079, 98021, 105170, 98062, 258813, 614758, 268694, 98039, 122581, 1022627, 1147150, 224306, 105180, 223774, 1474319, 310409, 105238, 1778319, 223103], "Phoenix": [73943, 115484, 266322, 224757, 75662, 223861, 73957, 224250, 112178, 73896, 74758, 74805, 642935, 73937, 73792, 142098, 118790, 73760, 73727, 74652, 244405, 1176612, 73712, 119335, 565626, 1646954, 73977, 119366, 118784, 248362, 1649037, 1633339, 119332, 74673, 1175228, 224748, 1146211, 118791, 248360, 268588, 118795, 119311, 119361, 119331, 73985, 1926212, 73803, 1036415, 73869, 73743, 74561, 74724, 248145, 73768, 223039, 73982, 74687, 217199, 118794, 2309045, 74732, 119314, 239801, 73817, 73884, 74720, 74410, 243927, 1164638, 73875, 112175, 73882, 74657, 73782, 118793, 119337, 224749, 74739, 73718, 248361, 1160848, 217193, 1160841, 73910, 74936, 74816, 74752, 74744, 73889, 73773, 73825, 1026671, 3405788, 73905, 119327, 73927, 74587, 3513445, 218100, 112162, 73859, 3156712, 73840, 248358, 73799, 73950, 239947, 73821, 118775, 119330, 119355, 239800, 262398, 271801, 1963064, 240681, 543136, 74583, 223036, 73751, 74669, 
73706, 73855, 73805, 73862, 74548, 74826, 74590, 73787, 74545, 73810, 277997, 119351, 73739, 74624, 866698, 754229, 313465, 115483, 729371, 119356, 866697, 118778, 115482, 112179, 1174692, 224733, 223273, 74834, 74626, 677854, 112154, 119353, 1158679, 240682, 119363, 816807, 286542, 223035, 74927, 1176581, 1485459, 1657449, 1201061, 74845, 73757, 634649, 73947, 1605022, 119365, 223860, 1147292, 73923, 1200121, 564652, 225578, 2015227, 2627745], "San Diego": [268157, 658421, 1147616, 665258, 112279, 80251, 268158, 82868, 79868, 79954, 287392, 80255, 80668, 482154, 218770, 80219, 80232, 217273, 235416, 80131, 79913, 80588, 218939, 79985, 83500, 223026, 83637, 80154, 119721, 119733, 80138, 247027, 226611, 224497, 80360, 79921, 225848, 119780, 80570, 78152, 80033, 80019, 82443, 80192, 119762, 80615, 1640258, 119734, 119726, 313514, 226607, 119776, 586465, 226602, 80244, 258654, 80280, 115612, 1158999, 550898, 550897, 550896, 559686, 550894, 225852, 1146136, 550899, 1146215, 83730, 1146141, 225851, 268152, 2239487, 80585, 1633360, 550893, 3431031, 550892, 1147592, 550888, 1146352, 1147255, 1201989, 80249, 119765, 79888, 123716, 635040, 266324, 80276, 80246, 80126, 83489, 226601, 224489, 83092, 82596, 83372, 1104554, 80350, 590139, 1508604, 112280, 119755, 79880, 80014, 119748, 79977, 650054, 79896, 80004, 82436, 119735, 80094, 550891, 83575, 1100081, 80530, 80189, 254300, 266323, 80096, 83958, 1109434, 82688, 1451746, 224494, 272663, 1647864, 80311, 585279, 280605, 623586, 226623, 295745, 79942, 240889, 83322, 80291, 119746, 223025, 80011, 226612, 83895, 224353, 119716, 119753, 141999, 80580, 83259, 80161, 80167, 80106, 76741, 80618, 83711, 81797, 119742, 80423, 224490, 223776, 79930, 80223, 80593, 82478, 224242, 80193, 556822, 119710, 501297, 80643, 285427, 80266, 194176, 80582, 218778, 218777, 80198, 80133, 119729, 80067, 602719, 631235, 80327, 80733, 79873, 80562, 83660, 80602, 119768, 82821, 518294, 79971, 79981, 212059, 258655, 79902, 83361, 628619, 119728, 80654, 
80590, 112247, 80109, 223027, 119730, 112258, 223220, 115598, 601802, 226619, 112281, 83078, 223973, 1011240, 83646, 272662, 79907, 80129, 244513, 78135, 625335, 80113, 113905, 218780, 83245, 81352, 80227, 115613, 119732, 1237001, 1502048, 574448, 498304, 571835, 119769, 80735, 543517, 1027494, 112253, 678597, 656430, 112273, 268155, 781627], "Austin": [181851, 604455, 1201024, 223620, 109000, 108966, 142074, 1866954, 108977, 1382102, 604457, 223680, 109004, 98474, 3263489, 98457, 98420, 108965, 1174687, 240526, 223707, 108961, 247103, 98433, 108964, 73759, 217735, 291290, 109001, 285294, 226433, 98441, 223684, 1221539, 108990, 142349, 98462, 111390, 108994, 108974, 608007, 223685, 220077, 108991, 108975, 656307, 288725, 223683, 217730, 108986, 243922, 98472, 109008, 98443, 226434, 1147269, 288724, 290548, 98437, 3531459, 290544, 3530783, 109005, 288747, 1206940, 268523, 223693, 223692, 620237, 1147682, 288745, 98409, 3505865, 291283, 284421, 217731, 1635868, 109013, 291287, 239890, 239891, 108998, 247102, 288743, 98467, 291291, 142018, 243756, 98405, 675150, 98415, 98439, 223678, 220106, 109010, 109007, 273366, 108988, 108984, 98424, 225440, 288742, 98447, 98416, 217732, 109002, 217736, 98413, 108963, 108995, 288732, 98438, 108987, 223675, 109009, 223713, 223714, 98435, 108999, 223679, 142017, 108983, 98428, 109006, 111377, 252821, 108997, 1176838, 108976, 1025910, 1571800, 109015, 111397, 108972, 98426, 566802, 98452, 217734, 526841, 73763, 108979, 108969, 1573301, 98445, 98436, 98464, 111381, 108971, 108996, 282698, 108962, 223686, 1173092, 259008, 98419, 252820, 98418, 111395, 570293, 252313, 566803, 223691, 109012, 98463, 108967, 223695, 82013, 98453, 1224950, 108982, 1189576, 3523356, 108981, 622833, 615166, 1751886, 557377, 1023853, 1889883, 1675976, 108980, 111393, 2008152, 1762662, 114938], "Baltimore": [223985, 656449, 1147514, 89327, 309189, 89343, 224642, 1479971, 89344, 89333, 275870, 674606, 93889, 89358, 1751278, 89331, 124839, 624736, 89357, 89325, 
313947, 124186, 93846, 1628876, 1156515, 1146898, 89332, 604930, 120951, 89362, 1629271, 89326, 574054, 1950129, 1206970, 93886, 631880, 1174784, 610125, 89353, 1436140, 89340, 225246, 89367, 217536, 89346, 225792, 291397, 89365, 1465016, 89351, 89382, 89361, 1007816, 89337, 77730, 100407, 120957, 1164933, 89336, 93892, 566439, 1821731, 223983, 1449313, 625154, 111408, 2196840, 2322597], "San Antonio": [2039194, 258651, 1236032, 99458, 123559, 2340364, 1732285, 1200768, 611291, 2151543, 99455, 1438859, 1674220, 1353074, 570285, 645211, 108932, 1116329, 953773, 676703, 108703, 223706, 223712, 1200881, 223058, 497953, 240451, 1175533, 108408, 108382, 1165284, 108534, 99445, 99487, 99420, 108533, 2064903, 99441, 99450, 1164501, 108913, 465532, 223696, 108736, 108936, 1465109, 99499, 99416, 1562631, 223697, 108943, 1164348, 108791, 273367, 225490, 99464, 1163830, 1021483, 1235859, 244322, 108577, 259215, 240452, 590753, 240568, 108206, 108642, 1165123, 99418, 604553, 108171, 240457, 99527, 99497, 223690, 99508, 108190, 99513, 108939, 108608, 108935, 223687, 293240, 99536, 223703, 1528530, 99501, 99431, 222987, 501431, 831103, 491073, 247839, 472231, 239357, 108933, 99542, 108857, 99521, 577395, 108219, 260945, 530411, 295487, 643318, 625462, 99502, 3411220, 2462694, 3366043, 514464, 1640920, 99460, 99459, 2299548, 1213585, 2510946, 1632769, 1638918, 108153, 108493, 1636046, 99519, 3377958, 1629164, 3378444, 99516, 240569, 2462661, 285811, 626899, 508145, 1643343, 1638992, 3417419, 99405, 1628885, 1645896, 1177746, 1630782, 1631657, 108253, 108938, 108255, 123710, 108426, 239973, 239967, 108303, 239968, 108941, 1209962, 99414, 108934, 244321, 244319, 99514, 1643616, 259218, 260935, 239972, 559584, 1146357, 483322, 1743841, 249576, 550977, 240487, 99452, 239974, 239966, 99540, 108252, 99506, 108158, 99472, 1486231, 122790, 99515, 108931, 631249, 99446, 99439, 2554690, 108154, 216867, 1209478, 73250, 1177260, 645210, 108831, 99417, 99419, 1014760, 122791, 1177887, 254917, 
1201142, 108260, 614530, 108574, 497952, 226014, 108251, 534695, 99461, 73236, 99421, 146138, 99518, 252502, 614476, 239971, 223229, 569882, 1741181, 621644, 108444, 124464, 534709, 590278, 223662, 320058, 99451, 99476, 248120, 223689, 108701, 99485, 99504, 1382269, 247773, 508084, 99480, 108562, 108522, 108339, 1139002, 1212773, 2549268, 108233, 217757, 108391, 108922, 108364, 99531, 108250, 268525, 108487, 108676, 73242, 99495, 1479977, 146143, 1762310, 574244, 108361, 99434, 109753, 99423, 108521, 1657244, 99438, 123557, 1382347, 99470, 223708, 1676193, 1144554, 112240, 1552856, 99433, 877968, 677533, 881708, 99462, 277948, 108884, 247123, 108306, 675441, 575206, 657967, 123556, 645212, 223716, 99489, 99494, 1229785, 1858821, 99468, 1673471, 223057, 1856923, 112231, 553469, 1200634, 99437, 1156873, 657719, 617387, 1421297, 99440, 1028312, 1477755, 858424, 108908, 1100734, 99530, 223715, 1006634, 498346, 1479635, 112227, 1390173, 223669, 223230, 1146124, 108763, 99453, 2516677, 1566913, 99488, 1514210, 608241, 1688532, 320049, 2155705, 112229, 239912, 108254, 1584731, 625299, 656713, 269651, 108571, 1723698, 2554348, 99535, 1929352, 1140713, 1673679, 288617], "Detroit": [90003, 234922, 95306, 530320, 95305, 95312, 1647936, 1901088, 89995, 605656, 89998, 114654, 1190550, 95308, 89999, 95300, 234917, 1633346, 2156247, 94554, 674740, 224064, 95294, 256897, 114661, 288605, 1230421, 1236680, 674735, 782678, 95302, 242702], "Indianapolis": [576787, 730126, 88177, 1502098, 564589, 91429, 91513, 223830, 287572, 278567, 1008650, 91553, 88158, 1214250, 88151, 91450, 91428, 1156950, 88175, 88172, 88164, 91544, 91607, 91502, 88159, 1520042, 91446, 240139, 1026913, 224819, 120770, 91484, 240136, 91443, 665394, 88140, 260932, 635243, 144736, 91338, 91608, 268137, 1158846, 1164179, 268138, 268135, 243720, 249677, 120784, 120786, 3580893, 124015, 582205, 268139, 240185, 88154, 1161248, 268136, 259022, 88148, 91561, 217026, 91436, 586270, 91490, 120802, 120795, 120811, 278566, 
120810, 240187, 275739, 91442, 120774, 120777, 223208, 141972, 88153, 78887, 1627952, 239898, 120767, 241032, 251963, 518323, 88138, 120796, 288193, 88143, 120803, 91515, 120813, 91496, 265878, 224809, 224830, 88150, 91477, 91542, 91599, 224799, 91506, 91432, 91605, 91522, 91475, 223829, 273699, 120766, 91454, 91458, 91573, 278568, 88161, 91435, 91494, 1759407, 120783, 631597, 88155, 91474, 631598, 88186, 223363, 91457, 91609, 1114620, 91551, 224820, 240134, 530673, 88144, 1567301, 224810, 1641470, 224814, 223827, 91519, 1239568, 91479, 88162, 91500, 674056, 224793, 91488, 278565, 91462, 1235801, 88168, 656462, 88188, 114631, 91509, 91602, 653125, 111624, 634658, 91441, 224831, 91440, 1514254, 224259, 1201174, 91596, 91491, 582252, 120798, 1456709, 120794, 224832, 111623, 91558, 88173, 1479845, 1592809, 91527, 223833, 91577, 88171, 1236866, 1206274, 1008647, 1762915], "San Francisco": [119657, 80747, 80780, 81456, 81514, 81165, 81022, 81450, 112307, 618542, 224956, 81985, 506418, 119601, 217844, 654030, 478253, 81459, 81461, 1119270, 81114, 82116, 80808, 81038, 81520, 80774, 112328, 119658, 112360, 81363, 81049, 80930, 627267, 81251, 80757, 81241, 81503, 112335, 81416, 81212, 291220, 80768, 112321, 80817, 1015196, 320147, 119663, 603022, 80978, 626656, 240893, 81524, 291689, 658566, 81379, 81480, 119636, 674036, 571428, 1201115, 268241, 224960, 595097, 275488, 1160927, 291332, 1641819, 112304, 1840699, 81246, 81487, 282764, 81526, 565629, 113924, 549444, 252811, 119632, 278862, 80766, 82105, 944406, 3165345, 80760, 1160908, 1223830, 1160921, 81256, 224957, 654032, 81150, 291071, 1546311, 1214408, 226814, 80987, 80799, 81383, 80806, 142261, 256730, 80950, 226829, 119637, 571427, 80788, 119650, 81007, 80756, 267364, 1973577, 217294, 1800858, 81976, 570865, 113927, 80821, 124967, 510378, 80977, 81782, 119590, 81959, 119661, 288687, 224955, 2236788, 119625, 291695, 82114, 81075, 80836, 1833071, 81004, 81476, 112325, 80879, 74059, 81035, 80920, 81418, 218776, 489082, 
80771, 112289, 141997, 1134288, 80963, 119626, 80753, 80823, 81367, 226834, 81237, 81177, 119640, 80786, 81466, 119593, 80864, 243535, 113942, 81042, 81375, 81531, 281778, 224951, 112320, 81295, 81222, 112311, 563989, 81377, 268240, 279426, 81529, 223955, 81141, 81103, 113923, 311255, 81803, 112303, 80925, 81169, 81087, 112338, 81215, 81315, 119623, 119643, 119665, 81249, 217813, 80802, 291227, 112293, 80917, 81110, 81209, 80793, 115623, 115617, 81082, 81669, 81192, 81397, 113928, 81019, 81204, 81444, 124765, 113940, 80999, 112347, 80937, 676408, 115625, 310867, 81511, 501344, 80797, 574449, 80990, 224958, 115644, 112373, 81126, 268533, 81394, 224953, 247005, 81409, 224948, 80983, 1175274], "Houston": [1866401, 99060, 1218737, 99081, 107915, 1966350, 108038, 1200103, 283873, 98952, 107956, 1158926, 282699, 239853, 665163, 111618, 99114, 107924, 223151, 223137, 258636, 98920, 1236706, 108057, 240436, 266158, 559491, 1630591, 99106, 242394, 108148, 99067, 585164, 98987, 107863, 258634, 108054, 223158, 1773009, 107834, 223154, 223164, 108149, 142023, 223148, 99132, 108020, 108150, 223141, 223160, 223179, 99101, 596014, 815515, 256700, 256702, 2712053, 650546, 99004, 223149, 98989, 107930, 99041, 1627951, 486939, 558146, 258635, 1636050, 266326, 1155392, 107884, 1514581, 98964, 595438, 1160746, 99013, 107846, 1146185, 226728, 239859, 98962, 223178, 98940, 107802, 277895, 108136, 488773, 223156, 107903, 217745, 107769, 223135, 122746, 226721, 107713, 142353, 266125, 596446, 98976, 223183, 223184, 107757, 2340286, 99051, 1382899, 244313, 99098, 277892, 1164945, 98937, 99031, 73463, 1146238, 1147065, 98972, 107999, 239355, 239858, 1647666, 2686185, 223185, 1901114, 1901111, 99000, 108137, 3627162, 558427, 634695, 1643419, 1633636, 240438, 249655, 1630761, 1237870, 1175129, 99091, 2152775, 1631148, 268142, 1163572, 1007915, 1645965, 99094, 1647932, 1636047, 109740, 243103, 645216, 108022, 665252, 652950, 3346006, 1632485, 258878, 268150, 258633, 223168, 258632, 3308100, 
1644317, 1147485, 602892, 2673301, 107772, 3564333, 1180363, 1640475, 98946, 1637168, 1633640, 98934, 109734, 247110, 99131, 257503, 73470, 240481, 239857, 99024, 122740, 503045, 2367166, 240443, 240444, 240445, 240446, 99045, 244316, 107787, 292556, 107911, 141902, 570195, 108006, 107743, 244314, 141893, 651629, 240435, 244196, 254040, 223194, 1751874, 240440, 107751, 223138, 98970, 603138, 558038, 108029, 217739, 98981, 98986, 649739, 239848, 98936, 223182, 108151, 108047, 223187, 107952, 252340, 653244, 1484167, 1224357, 1858908, 99017, 108145, 107768, 570092, 223180, 223175, 503400, 559409, 240483, 98955, 631351, 108066, 99082, 108060, 223157, 1138042, 557401, 1577352, 1971740, 244310, 223169, 99073, 99015, 107812, 217741, 240441, 223140, 107867, 223136, 258875, 223176, 109748, 1526288, 239356, 223177, 2160816, 240437, 1889985, 1583951, 2531544, 99014, 1724101, 1485278, 107718, 109742, 116265, 107859, 1212489, 1642905, 98997, 223172, 108010, 107913, 1146180, 107994, 107993, 223150, 223192, 3393901, 223144, 257022, 223143, 124460, 98999, 99104, 268149, 1158744, 1174691, 109751, 1416435, 217746, 257507, 1549134, 107844, 98959, 73481, 223167, 107957, 107990, 108002, 223153, 1222237, 223165, 98996, 223152, 1733514, 98966, 99120, 107783, 240439, 123943, 107929, 108142, 223139, 107947, 223159, 1236696, 98954, 107711, 268145, 223142, 1197126, 223171, 99103, 107776, 223155, 124937, 1645644, 98944, 674319, 223166, 1649109, 657890, 217744, 223193, 99066, 223228, 1103488, 878451, 107908, 98943, 98991, 1657341, 107954, 223147, 223189, 108004, 223134, 99007, 1556786, 99010, 108061, 99058, 288460, 99135, 1575212, 107826, 645215, 1863251, 107982, 99006, 671200, 1440365, 98956, 277894, 220094, 107986, 99110, 226753, 107856, 609502, 99116, 286987, 1026192, 107991, 812523, 293234, 268151, 286988, 1237172, 525232, 239865, 223173, 1478311, 1724007, 641273, 608401, 631349, 1846923, 570279, 99137, 266145, 1852890, 1100784, 223227, 223145, 530458, 622987, 518371, 596013, 1511925, 
99055, 1879027, 219703, 223146, 99054, 1015206, 3191802, 107836, 578694, 615260, 99109, 247108, 108141, 1205162, 266157, 1573321, 1438752, 98979, 1862847, 3236579, 73445], "Columbus": [246937, 123896, 95288, 1546086, 223728, 95253, 223755, 95284, 223509, 217654, 217653, 612540, 95241, 122230, 101657, 223749, 223753, 101661, 223730, 95285, 101647, 1628583, 101668, 223732, 1218847, 223764, 240079, 101660, 240082, 1225684, 1206195, 269926, 3450665, 2665542, 95243, 1175470, 1177485, 3532587, 90214, 101649, 95264, 1804281, 101665, 223734, 223767, 95236, 95240, 222972, 101757, 101670, 223762, 223772, 240078, 95275, 101635, 95242, 95271, 223763, 75212, 101643, 3574675, 114725, 95263, 223766, 223759, 101653, 1191338, 223737, 90216, 95235, 281206, 223765, 123895, 101640, 1643250, 101639, 223756, 123898, 101659, 101651, 101641, 101646, 101636, 95261, 223775, 124435, 95286, 223760, 95246, 626349, 240076, 249788, 95230, 95252, 896855, 223742, 95258, 75221, 95250, 75206, 95289, 95277, 95249, 122229, 1238209, 223726, 95293, 250903, 223223, 281777, 675842, 95265, 95247, 265892, 122237, 1382787, 95269, 95238, 268516, 223771, 223747, 223739, 518306, 223748, 223724, 1479195, 3400639, 223735, 2154314, 1200977, 258165, 278081, 223750, 2151296, 819653, 1157336, 1804801, 878115, 1588429, 1415082], "Philadelphia": [1510002, 102472, 122332, 96737, 102480, 96705, 249126, 112145, 96712, 102463, 102550, 112132, 224279, 220059, 112136, 1479774, 102510, 220057, 102492, 122326, 225277, 1147532, 543627, 595059, 122337, 122324, 122328, 1778574, 96684, 1861737, 122335, 1097234, 102509, 1164882, 74370, 96715, 102495, 96730, 102539, 142181, 102503, 115448, 102542, 271793, 220058, 102537, 96721, 102519, 102707, 96726, 1176615, 112137, 115444, 96688, 1022889, 96698, 125307, 112129, 102710, 217682, 225275, 123541, 96686, 247008, 96711, 102466, 122325, 112134, 483277, 112124, 74363, 122343, 662409, 499019, 1091941, 224280, 122315, 226730, 3186945, 96735, 3226761], "El Paso": [2351689, 108945, 675767, 
1235675, 108948, 240001, 225039, 73595, 1514287, 281755, 225031, 501984, 98827, 98819, 98805, 620239, 108955, 98809, 108958, 108953, 108959, 108946, 98817, 98808, 254913, 3215497, 98797, 1631049, 502974, 244399, 98820, 240000, 98814, 1875844, 98800, 225037, 225040, 225036, 98806, 225032, 490892, 2533204, 108957, 277881, 141894, 73589, 98824, 919225, 108944, 98798, 98825, 98815, 108956, 288559, 98804, 98802, 240621, 225041, 635070, 225038, 1175958, 98818, 98812, 652847, 225033, 225035, 1479831, 98810, 98821, 850464, 1878688, 1465226, 1485688, 108947, 225034, 1961981, 2145772]}
data/cmu/processed/hotel_id_to_name_map.json ADDED
The diff for this file is too large to render. See raw diff
 
data/cmu/processed/hotel_id_to_review_map.json ADDED
The diff for this file is too large to render. See raw diff
 
data/cmu/processed/score_threshold_per_city.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"Boston": 4.3816753729941, "Seattle": 4.292929292929293, "San Jose": 3.9189870025458933, "Charlotte": 4.078947368421052, "Chicago": 4.307793286806248, "Washington DC": 4.2648215648046115, "Fort Worth": 4.314204867006225, "Jacksonville": 4.201680672268908, "Denver": 4.1421869328493655, "Los Angeles": 3.9518072289156625, "New York City": 4.333333333333333, "Dallas": 4.115384615384615, "Memphis": 3.8454048993602745, "Phoenix": 4.174902912621359, "San Diego": 4.172192731727236, "Austin": 4.074248366013072, "Baltimore": 4.269613821138212, "San Antonio": 4.109909909909909, "Detroit": 4.015418719211822, "Indianapolis": 4.1498564593301435, "San Francisco": 4.16015625, "Houston": 4.1083121597096195, "Columbus": 4.0, "Philadelphia": 4.233009708737864, "El Paso": 4.113419913419913}