blob: ee4e62682aeaf7b27538eb01d7d152cc7c3d2373 [file] [log] [blame]
Ian Maxon857dc132015-09-25 17:13:19 -07001/*
2 * Licensed to the Apache Software Foundation (ASF) under one
3 * or more contributor license agreements. See the NOTICE file
4 * distributed with this work for additional information
5 * regarding copyright ownership. The ASF licenses this file
6 * to you under the Apache License, Version 2.0 (the
7 * "License"); you may not use this file except in compliance
8 * with the License. You may obtain a copy of the License at
9 *
10 * http://www.apache.org/licenses/LICENSE-2.0
11 *
12 * Unless required by applicable law or agreed to in writing,
13 * software distributed under the License is distributed on an
14 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
15 * KIND, either express or implied. See the License for the
16 * specific language governing permissions and limitations
17 * under the License.
18 */
/*
 * For every message in MugshotMessages, gather the text of each *other*
 * message (different message-id) whose tags fuzzy-match (~=) this message's
 * tags. Messages with no such matches are discarded; the remainder are
 * ordered by their number of matches (no explicit direction keyword is
 * given) and only the first 10 are returned, each paired with its list of
 * similarly tagged message texts.
 */
use dataverse TinySocial;

/* Similarity configuration; presumably what the ~= operator below consults
   (see the AsterixDB similarity-query documentation to confirm). */
set simfunction "jaccard";
set simthreshold "0.3";

for $current in dataset MugshotMessages
let $similar := (
    for $other in dataset MugshotMessages
    where $other.tags ~= $current.tags
      and $other.message-id != $current.message-id
    return $other.message
)
/* Bind the match count once; it is used for both filtering and ordering. */
let $matchCount := count($similar)
where $matchCount > 0
order by $matchCount
limit 10
return {
    "message" : $current.message,
    "similarly tagged" : $similar
};