blob: 4427369eeaabafa9e670cede78bf9d0185fed504 [file] [log] [blame]
/* Start from a clean slate: drop the `test` dataverse if it is already there,
   recreate it, and make it the current dataverse for the statements below. */
drop dataverse test if exists;
create dataverse test;
use dataverse test;
/* Closed record type describing an address (house number, street, city).
   Used as the type of the optional `address` field of CustomerType. */
create type AddressType as closed {
  number: int32,
  street: string,
  city:   string
}
/* Closed record type for the records stored in the Customers dataset.
   A trailing `?` marks a field as optional, `{{ ... }}` is an unordered list
   and `[ ... ]` is an ordered list. */
create type CustomerType as closed {
  cid:       int32,
  name:      string,
  age:       int32?,
  address:   AddressType?,
  interests: {{string}},
  children:  [
    { name: string, age: int32? }
  ]
}
/* Single-node nodegroup (nc1) that hosts the dataset. */
create nodegroup group1 if not exists on nc1;

/* Customers dataset, partitioned on its key `cid` and placed on group1. */
create dataset Customers(CustomerType) partitioned by key cid on group1;

/* Populate the dataset from the ADM-formatted customer file on nc1. */
load dataset Customers
  using "edu.uci.ics.asterix.external.dataset.adapter.NCFileSystemAdapter"
  (
    ("path"="nc1://data/semistructured/co1k/customer.adm"),
    ("format"="adm")
  );

/* Fuzzy keyword index over the `interests` field; it is created after the
   load, so it is built over data that is already in the dataset. */
create index interests_index on Customers(interests) type fuzzy keyword;
/* The query result is written to this file on node nc1. */
write output to nc1:"rttest/index-selection_fuzzy-inverted-index-ulist-jaccard.adm";

/* Return every customer whose `interests` pass a Jaccard similarity check
   against the query list with threshold 0.7.

   similarity-jaccard-check yields a list; its first element ($jacc[0]) is
   used as the filter predicate. The `let` binding is kept as-is so the shape
   of the query is unchanged.

   The result is ordered by `cid` (the dataset key) so that the file written
   above has a deterministic row order; without an `order by` clause the
   order of returned records is not guaranteed.

   NOTE(review): the query literal is an ordered list ([...]) while
   `interests` is declared as an unordered list ({{string}}) - confirm this
   mix is intended for the "ulist" variant of the test. */
for $c in dataset('Customers')
let $jacc := similarity-jaccard-check($c.interests, ["databases", "computers", "wine"], 0.7f)
where $jacc[0]
order by $c.cid
return $c