Skip to content

Commit 2c61ff7

Browse files
committed
fix
1 parent 0564d34 commit 2c61ff7

File tree

1 file changed

+4
-5
lines changed

1 file changed

+4
-5
lines changed

document-similarity/document-similarity-logic/src/main/pig/document-similarity-s1-rank_filter.pig

+4 -5
Original file line number | Diff line number | Diff line change
@@ -130,13 +130,12 @@ wc_ranked = load '$outputPath$WORD_RANK' as (rank_num:long,count:long,term:chara
130 130
wc_ranked_hr = foreach wc_ranked generate rank_num,count,term;
131 131
store wc_ranked_hr into '$outputPath$WORD_RANK_HR';
132 132

133-
134 133
--SPLIT wc_ranked INTO
135-
-- term_condition_accepted_tmp IF ($0 <= (double)tc.val*$removal_rate and $1 >= $removal_least_used),
136-
-- term_condition_not_accepted_tmp IF ($0 > (double)tc.val*$removal_rate or $1 < $removal_least_used);
134+
-- term_condition_accepted_tmp IF ($0 <= (double)tc.val*$removal_rate and $0 >= $removal_least_used),
135+
-- term_condition_not_accepted_tmp IF ($0 > (double)tc.val*$removal_rate or $0 < $removal_least_used);
137 136

138-
term_condition_accepted_tmp = filter wc_ranked by ($0 <= (double)tc.val*$removal_rate and $1 >= $removal_least_used);
139-
term_condition_not_accepted_tmp = filter wc_ranked by ($0 > (double)tc.val*$removal_rate or $1 < $removal_least_used);
137+
term_condition_accepted_tmp = filter wc_ranked by ($0 <= (double)tc.val*$removal_rate and $0 >= $removal_least_used);
138+
term_condition_not_accepted_tmp = filter wc_ranked by ($0 > (double)tc.val*$removal_rate or $0 < $removal_least_used);
140 139

141 140
doc_selected_termsX = foreach term_condition_accepted_tmp generate FLATTEN(docs) as docId, term;
142 141
store doc_selected_termsX into '$outputPath$WORD_COUNT';

0 commit comments

Comments
 (0)