#PARSER CQL
/// Source stream "ml100k": rating tuples (userid, itemid, rating, timestamp)
/// pulled from a tab-delimited file under ${PROJECTPATH}/datasets/ml-100k/.
/// NOTE(review): 'scheduler.delay' is presumably the pause between reads in
/// milliseconds -- confirm against the GenericPull wrapper documentation.
#RUNQUERY
CREATE STREAM ml100k (
    userid Integer,
    itemid Integer,
    rating Double,
    timestamp Long
)
    WRAPPER 'GenericPull'
    PROTOCOL 'CSV'
    TRANSPORT 'File'
    DATAHANDLER 'Tuple'
    OPTIONS (
        'filename' '${PROJECTPATH}/datasets/ml-100k/u_ordered.data',
        'delimiter' '\t',
        'scheduler.delay' '100'
    )
/// Source stream "ml100k_users": single-attribute tuples (userid) pulled from
/// a tab-delimited file under ${PROJECTPATH}/datasets/ml-100k/.
/// NOTE(review): 'scheduler.delay' is set to 1000 here versus 100 on the
/// ml100k stream; presumably milliseconds between reads, so users would
/// arrive more slowly than ratings -- confirm unit and intent.
#RUNQUERY
CREATE STREAM ml100k_users (
    userid Integer
)
    WRAPPER 'GenericPull'
    PROTOCOL 'CSV'
    TRANSPORT 'File'
    DATAHANDLER 'Tuple'
    OPTIONS (
        'filename' '${PROJECTPATH}/datasets/ml-100k/unique_temporal_ordered_users.data',
        'delimiter' '\t',
        'scheduler.delay' '1000'
    )
#PARSER PQL
/// Applies RECOMMENDATION_LEARN to the ml100k stream, mapping the operator's
/// item / user / rating parameters to the stream attributes 'itemid',
/// 'userid' and 'rating'. The learner is 'Mahout', configured through the
/// options list with an SVDRecommender and an SVDPlusPlusFactorizer.
/// The result is bound to the name recommendationModels.
#ADDQUERY
recommendationModels = RECOMMENDATION_LEARN(
    {
        item = 'itemid',
        user = 'userid',
        rating = 'rating',
        learner = 'Mahout',
        options = [
            'OptionRecommender'='SVDRecommender',
            'OptionFactorizer'='SVDPlusPlusFactorizer'
        ]
    },
    ml100k
)
/// Applies RECOMMENDATION to two inputs, in this order:
///   1. ml100k_users         -- the stream of user ids
///   2. recommendationModels -- the output of the RECOMMENDATION_LEARN query
/// The 'user' parameter names the 'userid' attribute and
/// no_of_recommendations is fixed at 5.
/// NOTE(review): recommender = 'recommender' presumably names the attribute
/// of the second input that carries the learned model -- confirm against the
/// RECOMMENDATION_LEARN output schema.
/// A stray trailing '|' after the closing parenthesis was removed; it is not
/// part of the operator call.
#ADDQUERY
recommendations = RECOMMENDATION(
    {
        recommender = 'recommender',
        user = 'userid',
        no_of_recommendations = 5
    },
    ml100k_users,
    recommendationModels
)