/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

/*
 * Start from a clean slate: remove any existing `twitter` database,
 * create it again, and select it for the statements that follow.
 */
drop database twitter if exists;
create database twitter;

use twitter;


/*
 * Record type for a single tweet: two numeric identifiers, a location
 * point, a timestamp, and the tweet text.
 */
create type twitter.Tweet as
{
  id : int32,
  tweetid : int64,
  loc : point,
  time : datetime,
  text : string
};

/*
 * External table of Tweet records backed by the ADM-format file
 * smalltweets.txt, read through the NCFileSystemAdapter.
 * NOTE(review): the "asterix_nc1://" prefix presumably names the node
 * that hosts the file -- confirm against the test cluster configuration.
 */
create external table TwitterData(Tweet)
using "org.apache.asterix.external.dataset.adapter.NCFileSystemAdapter"
(
  ("path"="asterix_nc1://data/twitter/smalltweets.txt"),
  ("format"="adm")
);

/*
 * Word count over tweet text, with the result directed to
 * /tmp/count-tweets.adm on asterix_nc1.
 *
 * Each tweet's text is split with "word-tokens"; the tokens are grouped
 * by value and one record {'word', 'count'} is emitted per group.
 * NOTE(review): `tokens` is referenced in the from clause before the
 * with clause that binds it -- this ordering is kept exactly as in the
 * original query; confirm it is what the parser test intends.
 */
write output to asterix_nc1:"/tmp/count-tweets.adm";
select element {'word':tok,'count':twitter.count(token)}
from TwitterData as t,
     tokens as token
with tokens as twitter."word-tokens"(t.text)
group by token as tok
;