Skip to content

Commit 57b3887

Browse files
Chen Zhiling authored and feast-ci-bot committed
Deduplicate rows in subquery (feast-dev#409)
* Deduplicate rows in subquery
* Rename columns
* Use correct feature names
* Select k.* instead of iterating through fields
1 parent 2b291a3 commit 57b3887

1 file changed

Lines changed: 10 additions & 2 deletions

File tree

serving/src/main/resources/templates/single_featureset_pit_join.sql

Lines changed: 10 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -15,7 +15,7 @@ SELECT
1515
{{ featureSet.entities | join(', ')}},
1616
false AS is_entity_table
1717
FROM `{{projectId}}.{{datasetId}}.{{ featureSet.project }}_{{ featureSet.name }}_v{{ featureSet.version }}` WHERE event_timestamp <= '{{maxTimestamp}}' AND event_timestamp >= Timestamp_sub(TIMESTAMP '{{ minTimestamp }}', interval {{ featureSet.maxAge }} second)
18-
)
18+
), joined AS (
1919
SELECT
2020
uuid,
2121
event_timestamp,
@@ -44,4 +44,12 @@ SELECT
4444
{% endfor %}
4545
FROM `{{projectId}}.{{datasetId}}.{{ featureSet.project }}_{{ featureSet.name }}_v{{ featureSet.version }}` WHERE event_timestamp <= '{{maxTimestamp}}' AND event_timestamp >= Timestamp_sub(TIMESTAMP '{{ minTimestamp }}', interval {{ featureSet.maxAge }} second)
4646
) USING ({{ featureSet.project }}_{{ featureSet.name }}_v{{ featureSet.version }}_feature_timestamp, created_timestamp, {{ featureSet.entities | join(', ')}})
47-
WHERE is_entity_table
47+
WHERE is_entity_table
48+
)
49+
SELECT
50+
k.*
51+
FROM (
52+
SELECT ARRAY_AGG(row LIMIT 1)[OFFSET(0)] k
53+
FROM joined row
54+
GROUP BY uuid
55+
)

0 commit comments

Comments
 (0)