Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Moving dependence from custom branch's tour_model to master's trip_model #933

Merged
merged 10 commits into from
Sep 14, 2023
16 changes: 13 additions & 3 deletions emission/analysis/modelling/similarity/od_similarity.py
Original file line number Diff line number Diff line change
Expand Up @@ -16,6 +16,16 @@ def extract_features(self, trip: ecwc.Confirmedtrip) -> List[float]:
return ctfe.od_features(trip)

def similarity(self, a: List[float], b: List[float]) -> List[float]:
o_dist = ecc.calDistance([a[0], a[1]], [b[0], b[1]])
d_dist = ecc.calDistance([a[2], a[3]], [b[2], b[3]])
return [o_dist, d_dist]
"""
a : a list of point features that can take either of two forms
1. [point1_latitude,point1_longitude]
2. [point1_latitude,point1_longitude,point2_latitude,point2_longitude]

b : a list of point features that can take either of two forms
1. [point1_latitude,point1_longitude]
2. [point1_latitude,point1_longitude,point2_latitude,point2_longitude]
"""
point_dist = [ecc.calDistance(a[i:i+2], b[i:i+2])
shankari marked this conversation as resolved.
Show resolved Hide resolved
for i in range (0,len(a),2)]

return point_dist
14 changes: 5 additions & 9 deletions emission/analysis/modelling/similarity/similarity_metric.py
Original file line number Diff line number Diff line change
Expand Up @@ -27,21 +27,17 @@ def similarity(self, a: List[float], b: List[float]) -> List[float]:
"""
pass

def similar(self, a: List[float], b: List[float], thresh: float, clusteringWay :str = 'origin-destination') -> bool:
def similar(self, a: List[float], b: List[float], thresh: float) -> bool:
"""compares the features, returning true if they are similar
within some threshold

:param a: features for a trip
:param a: features for a trip ,
:param b: features for another trip
:param thresh: threshold for similarity
:clusterinWay: clustering based on origin/destination/origin-destination-pair
:clusteringWay: clustering based on origin/destination/origin-destination-pair
:return: true if the feature similarity is within some threshold
"""
similarity_values = self.similarity(a, b)
shankari marked this conversation as resolved.
Show resolved Hide resolved
if clusteringWay == 'origin':
is_similar = similarity_values[0] <= thresh
elif clusteringWay == 'destination':
is_similar = similarity_values[1] <= thresh
else:
is_similar = all(map(lambda sim: sim <= thresh, similarity_values))
is_similar = all(sim <= thresh for sim in similarity_values)
shankari marked this conversation as resolved.
Show resolved Hide resolved

return is_similar
Original file line number Diff line number Diff line change
Expand Up @@ -207,14 +207,22 @@ def _find_matching_bin_id(self, trip_features: List[float]) -> Optional[str]:
finds an existing bin where all bin features are "similar" to the incoming
trip features.

:param trip_features: feature row for the incoming trip
:param trip_features: feature row for the incoming trip.
takes the form [orig_lat, orig_lon, dest_lat, dest_lon]
:return: the id of a bin if a match was found, otherwise None
"""
for bin_id, bin_record in self.bins.items():
matches_bin = all([self.metric.similar(trip_features, bin_sample, self.sim_thresh,self.clusteringWay)
for bin_sample in bin_record['feature_rows']])
if matches_bin:
return bin_id
if self.clusteringWay == 'origin':
shankari marked this conversation as resolved.
Show resolved Hide resolved
start,end=0,2 #since first two features in trip_features are for origin
elif self.clusteringWay == 'destination':
start,end=2,4 #third and fourth values intrip_features are for destination
elif self.clusteringWay == 'origin-destination':
start,end=0,4 #when clusteromgWay is 'origin-destination',we pass all four features

matches_bin = all([self.metric.similar(trip_features[start:end], bin_sample[start:end], self.sim_thresh)
for bin_sample in bin_record['feature_rows']])
if matches_bin:
return bin_id
return None

def _nearest_bin(self, trip: ecwc.Confirmedtrip) -> Tuple[Optional[int], Optional[Dict]]:
Expand Down