/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements. See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership. The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License. You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied. See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */
/*
 * Fixture setup: recreate the `test` dataverse from scratch, declare the
 * DBLP record type and dataset, bulk-load the sample data, and direct the
 * output of the query that follows to a file on nc1.
 */
drop dataverse test if exists;
create dataverse test;
use dataverse test;

/* Closed record type: exactly these five fields. */
create type DBLPType as closed {
  id: int32,
  dblpid: string,
  title: string,
  authors: string,
  misc: string
}

/* Node group spanning the two node controllers nc1 and nc2. */
create nodegroup group1 if not exists on nc1, nc2;

/* DBLP dataset, keyed on `id`, placed on group1. */
create dataset DBLP(DBLPType)
  primary key id on group1;

/*
 * Load DBLP from a ':'-delimited text file on nc1.
 * NOTE(review): `pre-sorted` presumably asserts that the input is already
 * ordered by the primary key -- confirm against the data file.
 */
load dataset DBLP
using "org.apache.asterix.external.dataset.adapter.NCFileSystemAdapter"
(("path"="nc1://data/dblp-small/dblp-small-id.txt"),("format"="delimited-text"),("delimiter"=":")) pre-sorted;

/* Destination on nc1 for the output of the query below. */
write output to nc1:"rttest/consolidate-complex-selects.aql";

/*
 * For every DBLP paper, tokenize its title and a fixed query string into
 * words, run three Jaccard similarity checks between the two token lists
 * (thresholds 0.8, 0.5 and 0.3), and keep the papers that satisfy all the
 * conjuncts of the `where` clause, including authors = "testauth".
 * Returns the paper's token list and the query's token list.
 *
 * The output file name suggests this exercises consolidation of several
 * select conditions by the optimizer -- TODO confirm against the expected
 * plan.
 *
 * NOTE(review): $jacca and $jaccb are tested through their first element
 * ([0]), but $jaccc is used whole. This looks inconsistent; it is left
 * unchanged because altering the predicate would presumably change the
 * expected plan. Confirm whether the bare $jaccc is intentional.
 */
for $paper in dataset('DBLP')
let $paper_tokens := word-tokens($paper.title)
let $query_tokens := word-tokens("Transactions for Cooperative Environments")
let $jacca := similarity-jaccard-check($paper_tokens, $query_tokens, 0.8f)
let $jaccb := similarity-jaccard-check($paper_tokens, $query_tokens, 0.5f)
let $jaccc := similarity-jaccard-check($paper_tokens, $query_tokens, 0.3f)
where $jacca[0] and $jaccb[0] and $paper.authors = "testauth" and $jaccc
return {"Paper": $paper_tokens, "Query": $query_tokens }