http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/blob/c013f617/userguide/search_index.json
----------------------------------------------------------------------
diff --git a/userguide/search_index.json b/userguide/search_index.json
index 2a1757c..9938512 100644
--- a/userguide/search_index.json
+++ b/userguide/search_index.json
@@ -1 +1 @@
-{"index":{"version":"0.5.12","fields":[{"name":"title","boost":10},{"name":"keywords","boost":15},{"name":"body","boost":1}],"ref":"url","documentStore":{"store":{"./":["(asf),","adadelta.","adapt","algorithm","analyt","anomali","apach","architectur","art","batch","build","built","classification,","collect","confid","consid","conversely,","cross","data","design","detection,","eas","effort","engineering.","factor","featur","foundat","function","functionalities:","functions.","hive","hive/pig.","hivemal","incub","incubator.","interface.","introduct","k","learn","learning;","librari","machin","machines,","mainli","model","nearest","neighbor,","number","offer","pig","platform","predict","provid","queri","recommendation,","regression,","regular","run","runtime.","soft","softwar","spark","spark/pig,","sponsor","state","such","support","through","thus,","udf/udaf/udtf","undergo","us","varieti","vectors,","versatil","weight","weighted,"],"getting_started/":["(asf),","apach","effort","founda
 
t","get","hivemal","incub","incubator.","softwar","sponsor","start","summari","undergo"],"getting_started/installation.html":["$","$home/.hiverc","(asf),","./target.","/home/myui/tmp/defin","/home/myui/tmp/hivemal","/tmp/defin","/tmp/hivemal","7","add","all.hiv","all.hive;","alternatively,","apach","automat","bin/build.sh","build","cd","choic","clone","command","core","defin","dependencies.jar","dependencies.jar;","docker","each","effort","file.","find","follow","foundat","function","git","hadoop","hive","hivemal","hivemall.git","https://github.com/apache/incub","incub","incubator.","instal","jar","java","later","line","load","pig","platforms:","prerequisit","run","session.","softwar","sourc","spark","sponsor","start","test","then,","time","time.","two","undergo","v0.13","v2.4.0","xxx"],"getting_started/permanent-functions.html":["\"hivemall.\"","\"hivemall.*\";",";(asf),","/apps/hivemal","/tmp/defin",">","apach","auxiliari","avoid","call","case","cautiony","confirm","creat","databas
 
","database.","databases,","ddl","default","defin","dependencies.jar","dependencies.jar;","each","effort","exist","first,","follow","follows:","foundat","fs","function","hadoop","hdf","hive","hivemal","hivemall.","hivemall.adadelta","hivemall.adagrad","hivemall;","hiveserv","hivevar:hivemall_jar=hdfs:///apps/hivemall/hivemal","incub","incubator.","instal","jar","later","live","load","mkdir","need","non","p","perman","permanent.hive,","permanent.hive;","prefix","put","queri","scheme,","script","session.","sessions.","set","show","softwar","sourc","specifi","sponsor","step","support","then,","through","udf","udfs.","undergo","us","v0.13"],"getting_started/input-format.html":["\"0\"","\"0:1.0\"","\":\",","\"dog\"","\"height:1.5\"","\"length:2.0\"","\"length:2.0\")","\"name\"),","\"weight\"),","\"xxxxxxx","(","(+1)","(=16777216)","(a.k.a.","(asf),","(binari","(call","(cf.","(e.g.,","(for","(i.e.,","(int","(or","(v0.3.1","(we","(weight)",")","),",");","...)","0","0,","0.0","0.0f","1","1)
 
","1),","1,","1.","1.0","1.0,","1.0.","1.0f","10:3.4","123:0.5","16777216.","2","2^24","3)","34567:0.231","43352:55.3","55.0","55.0);",":","::=","[\"1:3.0\",\"2:4.0\",\"3:5.0\"]","[\"apple:1.0\",\"value:120.3\"]","[\"is_cat#1\",\"is_dog#0\",\"is_lion#1.0\",\"is_pengin#true\",\"species#dog\"]","[10,7,9]","accept","actual","ad","add_feature_index","add_feature_index(array(3,4.0,5))","addbia","addit","alternatively,","apach","append","appli","argument","arguments:","array","array<int|bigint|text>","array(\"bias:1.0\"),","array(\"height\",","array(\"height:1.5\",","array(\"id\",","array(\"is_cat\",\"is_dog\",\"is_lion\",\"is_pengin\",\"species\"),","articl","befor","between","bia","bias/dummi","bigint)","bigint,","binari","call","cast","cast(target","categor","categorical_features(","categorical_features(array","class","class)","classif","classifi","click_or_not","column","column.","common","compat","compress","concat(\"weight\",\":\",55.0);","concat(mhash(extract_feature(\"xxxxxxx",
 
"concat_array(","consid","convert_label(","convert_label(0.0f),","convert_label(1),","convert_label(1.0f)","creat","data","default","denot","describ","detail.","dimens","don't","doubl","dual;","dummi","e.g.","each","ebnf","effort","element","entry.","exampl","example,","example.","example:","examples.","except","explain","explanatori","explicitli","extract_feature(\"weight:55.0\"),","extract_weight(\"weight:55.0\");","extract_weight(\"xxxxxxx","featur","feature(\"weight\",","feature(mhash(extract_feature(\"xxxxxxx","feature_index(array(\"10:0.2\",\"7:0.3\",\"9\"));","featurenames,","features)","features,","features.","first","fit","float","float)","follow","follows:","format","format.","format:","foundat","function","function)","function.","gener","general,","hand,","happens.","hash","hashing/hash","height,","helper","here","here,","hivemal","hivemall.","huge","hyperparameters).","id,","import","incub","incubator.","index","index)","index.","input","instanc","int","int,","label","la
 
bel,","label.","large.","later","later)","later,","learning.","less","libsvm","logist","long","machin","memori","mention","mhash","model","multi","name","need","neg","normal","notat","note","note:","number","number.","numbers,","omit","option","outofmemori","page","pleas","posit","predict","prepar","primit","probabl","produc","provid","quantit","quantitative_features(","quantitative_features(array","quantitative_features(array(\"apple\",\"value\"),1,120.3);","rang","real","refer","regress","regression)","regression,","regression.","repres","reserv","respectively.","respons","response/predictor","row","rowid()","rowid,","scheme","select","setting.","similar","softwar","spaces,","spars","specif","specifi","sponsor","start","statistics).","statistics,","storage)","support","tabl","table.","table;","take","target","target)","target.","text","text.","through","train","trick","true,","two","type","typically,","undergo","us","usual","v0.3","v0.3,","v0.3.2","v0.4.0","valu","variabl","variab
 
le,","variable.","variables.","vector","veri","vowpal","wabbit.","weight","weight.","weight:55.0","weight:55.3\")","weight:55.3\"))","weight:55.3\")),","yyyyyi","|"],"tips/":["(asf),","apach","effect","effort","foundat","hivemal","incub","incubator.","softwar","sponsor","tip","undergo"],"tips/addbias.html":["\"0\"","(\"","(0,0).","(1,1)","(2,2)","(asf),","(feature,weight)","(or","(select",")","1\"","ad","add","addbias()","addbiasudf","alway","apach","avg(weight)","b","b,","becuas","befor","better","bia","both(important!)","cast(split(feature,\":\")[1]","claus","clause,","consid","creat","cross","data","dataset","default.","detail.","divid","e2006tfidf_pa1a_model","e2006tfidf_test","e2006tfidf_test_explod","e2006tfidf_train_x3","effort","enabl","examples.","exist","explicit","explode(addbias(features))","express","extract_feature(feature)","extract_weight(feature)","f(x)","f(x).","f(x)=wx+b","f(x)=y,","featur","feature,","feature;","float)","follow","follows.","form","found","foundat
 
","function","group","hivemal","hivemall,","hyperplan","incub","incubator.","label","later","learn","make","model","note","origin","origin.","pa1a_regress(addbias(features),target)","point","predict","regularization),","rowid,","see","select","softwar","split(feature,\":\")[0]","sponsor","t","tabl","target,","test","then,","train","trainer","training/test","undergo","us","v0.3)","v0.3.1","valu","vector.","view","w,","weight","without","x","y","y=f(x)=wx"],"tips/rand_amplify.html":["${shufflebuffersize}","${shufflebuffersize},","${xtimes}","(","(0.743392)","(0.746214)","(a","(asf),","(copy)","(e.g.,","(external)","(feature,weight)","(rowid,","(sec)","(select",")","*","*)","0.734805","0.743392","0.746214","1","100","116.424","2","2012,","3.","479.855","89.718","abov","accuraci","actual","algorithm","amplifi","amplifier+clust","amplify(${xtimes},","amplify()","apach","argument","articl","auc","avoid","becom","below:","better","bottleneck","bottleneck.","buffer","cast(avg(weight)","caus
 
","claus","cluster","conclus","converg","creat","cup","data,","deal","definit","descent)","distribut","each","effect","effici","effort","elaps","enumer","even","exampl","example)","example,","example.","examples,","execut","explain","factor","factor.in","feature,","feature;","features)","file","filled.","first","float)","follow","follows:","foundat","function","good","gradient","group","hdfs.","higher","hivemal","hivevar:shufflebuffersize=1000;","hivevar:xtimes=3;","however,","improv","in/out","incub","incubator.","input","instance.","instead","involv","iter","iterations.","job","job.","kdd","key","key.","known","label,","larg","learn","local","logress(features,label)","lr_model_x3","m/r","machin","mandatori","map","mapreduc","merg","method","models.","more","multipl","need","note","oper","order","output","phase","plain","predict","problem","problem.","provid","queri","rand();","rand_amplifi","rand_amplify(${xtimes},","rand_amplify()","rand_amplify(),","random","randomli","reason","
 
recommend","record","reduc","replac","requir","result","return","row","row.","score.","select","set","sever","show","shown","shuffl","shuffled.","similar","singl","slow","small","so,","softwar","sort!","spark","specifi","sponsor","stage","steps.","stochast","suit","t","tabl","task","task.","tasks,","techniqu","then,","through","time","time.","track","train","training_orcfil","training_orcfile;","training_x3","trainning_x3","udtf","undergo","us","user","variants.","veri","view","weight","within","without"],"tips/rt_prediction.html":["\"\\n\"","\"\\t\"","$sqoop_home/lib.","'\\n'","'\\t'","'a9a_model1_tsv'","'features'","'sqoop';","'sqoop'@'%'","'t'","(","(/etc/mysql/my.conf)","(0,1,10)","(0,1,10);","(0.00","(1.0","(asf),","(feature);","(i.e.,","(jdbc","(option","(rowid)","(t.featur",");","*","+","/","//","/user/hive/warehouse/a9a.db/a9a_model1_tsv","/user/hive/warehouse/a9a.db/a9atest_exploded_tsv","0","0.0","0.0)","0.05595205126313402","0.1310696931351625","0.21053194999694824","0.5,
 
","0.5761121511459351","1","1.0","1.0).","1.0,","1.4.5","1.5259535312652588","10","10;","12427","12427;","12428","16","2.6.","3","3;","5","67","7","73","74","76","82","83",";","=",">","\\","a9a","a9a.*","a9a;","a9a_model1","a9a_model1;","a9a_model1_feature_index","a9a_model1_tsv","a9a_model1_tsv;","a9atest","a9atest_explod","a9atest_exploded_rowid_index","a9atest_exploded_tsv","a9atest_exploded_tsv;","abov","access","achiev","add","alreadi","alternatively,","apach","article,","assum","batch","be","begin","better","bigint,","bin/sqoop","binari","bind_address","boost","btree;","build","build.xml","carri","categor","check","classif","column","configur","connect","connector","creat","data","databas","dbms.","defin","delimit","desc","dir","directori","do","doubl","double)","driver)","drop","each","edit","effort","end;","entri","exist","exp(","explain","explode(addbias(features))","export","exported.","extend","extract_feature(feature)","extract_weight(feature)","featur","feature,","featu
 
re;","field","file","find","finishes,","flush","follows:","forget","format","foundat","function","grant","hadoop","hadoop.","hadoop_common_home=${hadoop_home}","hadoop_conf_dir=${hadoop_home}/etc/hadoop/","hadoop_home=/opt/hadoop","have","hdf","here","hive","hive,","hive.","hivemal","however,","id","identifi","if(sigmoid(sum(t.valu","import","incub","incubator.","index","input","int,","itself","ivy.xml","java.jar","jdbc:mysql://${mysql_host}/a9a","join","label,","languag","later","learn","left","limit","line","list","locat","location:hdfs://dm01:9000/user/hive/warehouse/a9a.db/a9a_model1_tsv","location:hdfs://dm01:9000/user/hive/warehouse/a9a.db/a9atest_exploded_tsv,","logist","lookup","m","m.featur","m.feature)","m.weight))","master","model","mysql","mysql.","mysql>","mysql_host=dm01","need","node","onlin","online/r","online/realtim","outer","packag","particular","password","patch.","predict","prediction.","prepar","prerequisit","privileg","privileges;","prob","prob,","probabl","pr
 
ocess","process;","provid","put","query.","rdbm","read","real","recommend","regress","relat","return","row","rowid","rowid,","rowids.","run","scheme","sec)","select","server","set","shown","sigmoid","sigmoid(sum(m.weight))","sigmoid(sum(t.valu","sigmoid(x","sigmoid;","similar","simpli","slave","so,","softwar","sponsor","sql","sqoop","sqoop.","step)","store","successfulli","support","t","t.rowid","tabl","table,","tables.","target","task.","termin","test","textfil","then,","time","transact","tsv","undergo","uniqu","us","user","usernam","v2.6.0.","valu","view","way","weight","x));","|"],"tips/ensemble_learning.html":["(","(asf),","(label,feature,weight)","(label,feature,weight,covar)","(select","(t.featur","(t.rowid",")","*","/home/myui/tmp/defin","/home/myui/tmp/hivemall.jar;","0.8474830954169797","0.8482344102178813","0.8494866015527173","0.8499874780866516","0.850488354620586","1;",":","=","==","[case1]","[case2]","accuraci","actual","actual,","add","algorithm","all.hive;","apach","
 
argmin_kld(feature,","arow","better","broth","case","cast(featur","clean","cnt","cook","count(1)","count(1)/3993","covar)","creat","cw","default","delet","drop","effort","ensembl","ensemble(model)","ensemble(prediction)","ensemble/mix","evalu","exampl","explain","feature,","feature;","foundat","group","head","hive.exec.parallel.thread.number=8;","hive.exec.parallel=false;","hive.exec.parallel=true;","hivemal","hivemall.two","incub","incubator.","int)","jar","join","label","label)","label,","later","learn","learning.","left","let'","m","m.col0","m.col1","m.feature)","m.label","m.label,","mani","mapred.reduce.tasks=","mapred.reduce.tasks=4;","maxrow(cnt,","maxrow(score,","model","news20mc_arow_predict1","news20mc_cw_predict1","news20mc_ensemble_model1","news20mc_ensemble_model1;","news20mc_ensemble_predict1","news20mc_ensemble_predict1;","news20mc_ensemble_submit1","news20mc_ensemble_submit1;","news20mc_pred_ensemble_predict1","news20mc_pred_ensemble_submit1","news20mc_scw2_predict1",
 
"news20mc_test","news20mc_test_explod","news20mc_train_x3","one?","outer","pd","pd.label","pd.rowid);","predict","predicted;","prepar","replac","reset","rowid","rowid,","run","score","score,","scw2","select","set","softwar","sourc","spoil","sponsor","stabl","sum(m.weight","t","t.label","t.rowid,","t.value)","t1","t2","t2;","t3;","tabl","train","train_multiclass_arow(addbias(features),label)","train_multiclass_cw(addbias(features),label)","train_multiclass_scw(addbias(features),label)","udf","undergo","unfortunately,","union","v0.1","v0.2","verifi","view","voted_avg(weight)","weight"],"tips/mixserver.html":["\"","#","(3","(asf),","(feature,weight)","(mix","(netty,jsr305)","(select","(w/","(w/o",")","./run_mixserv.sh","0.844835019263103","0.8678096499719774","11212","32","5","abov","access","accuraci","ad","apach","assum","asynchron","better","bin/run_mixserv.sh","block","brief","cast(voted_avg(weight)","caution:","certain","classifiers.","cluster","commun","configur","contain","conve
 
rg","creat","current","dataset.","default","dependencies.jar","design","detail","due","effect","effici","effort","enabl","enough","exampl","experience,","explain","explan","fast","faster","feature,","feature;","file","find","first,","float)","follow","follows:","foundat","furthermore,","gbe","group","hadoop","handl","hive.","hivemal","hivemall.","horizont","host01,","host01,host02,host03\")","host03","host03.","i/o.","improv","incub","incubator.","instal","installation.","intern","jar","kdd10a_pa1_model1","kdd10a_train_x3","kdd2010;","kdd2010a","larg","later","make","minimum","mix","mix\"","mix)","mix).","mixing.","mixserv.jar","mixserver.java","model","multipl","neglig","networking.","node","nodes.","nodes:","non","normal","now,","option","options.","overhead","pa1","page,","perform","port","port\"","predict","prerequisit","protocol","put","query.","recommend","requir","run","run_mixserv.sh.","scalabl","see","seen","select","server","server(s)","server)","servers.","set","simpl","s
 
ize","size).","slide.","softwar","sponsor","standard","sure","t","tabl","target/hivemal","though.","through","throughput","thu","time","train","train_pa1(addbias(features),label,\"","undergo","us","v0.3","weight","worker"],"tips/emr.html":["\"","\",\"","\"hive","\"hivemal","\"instal","\"instance.ismaster=true,s3://${s3bucket}/emr/conf/emr_hivemall_bootstrap.sh\"","\"instance.ismaster=true,s3://mybucket/emr/conf/emr_hivemall_bootstrap.sh\"","${s3bucket}/datasets/news20b/[train|test].","${s3bucket}/emr/conf","${s3bucket}/emr/log","${s3bucket}/emr/output","'\\n'","'\\t'","'s3://${s3bucket}/emr/outputs/news20b_arow_model1';","'s3n://${s3bucket}/datasets/news20b/test';","'s3n://${s3bucket}/datasets/news20b/train';","(","(arow)","(asf),","(emr).http://docs.aws.amazon.com/elasticmapreduce/latest/developerguide/emr",";(feature,weight)","(rowid,","(select","(t.featur","(t.rowid",")","*","*)","./elast","./tmp/defin","./tmp/hivemall.jar;","0.0","0.175","0.35","0.7","0.9659727782225781","1","100
 
","1000,","1a","2","3","3.0.0\".","8","=","==",">","\\","action","actions/configur","actions/instal","actions/run","actual","actual,","adapt","add","aliv","all.hive;","amazon","ami","amplify(3,","ap","apach","arg","array","avail","befor","best","bid","bootstrap","both","c,fs.s3n.multipart.uploads.enable=true,","c,fs.s3n.multipart.uploads.split.size=67108864\"","case","cast(rand(47)","cast(rand(49)","cast(rand(50)","cast(split(feature,\":\")[0]","cast(split(feature,\":\")[1]","cast(voted_avg(weight)","cheap","clean","cli","client","cluster","cluster\"","collect","core","core/task","count","count(1)/4996","creat","data","databas","debug","default","delimit","drop","e.g.,","effort","elast","emr","emr_hivemall_bootstrap.sh","enabl","end","evalu","exist","explode(addbias(features))","extern","featur","feature,","feature;","features)","field","float","float)","follows.","follows:","format","foundat","ganglia","ganglia\"","group","gui","hadoop","hadoop,","hive","hive.html","hivemal","hivev
 
ar:s3bucket=your_bucket_name;","i'm","incub","incubator.","input","insert","instanc","instead","int)","int),","int);","int,","interact","item","jar","job","job,","join","label","label,","larg","later","latest","launch","learn","left","line","locat","log","lunch","m","m,mapred.child.java.opts=","m,mapred.tasktracker.map.tasks.maximum=7,","m,mapred.tasktracker.reduce.tasks.maximum=2,","m.feature)","m1.larg","m1.medium","m1.xlarg","mapred.max.split.size=67108864;","mapreduc","master","mode.","money.","name","news20;","news20b_arow_model1","news20b_arow_model1;","news20b_arow_predict1","news20b_arow_predict1;","news20b_arow_submit1","news20b_arow_submit1;","news20b_test","news20b_test_explod","news20b_train","news20b_train;","news20b_train_x3","northeast","old","optionally,","or,","outer","output","overwrit","pd","pd.label","pd.rowid);","predict","predicted;","prepar","prerequisit","price","put","rand_amplify(3,","recommend","regular","replac","row","rowid","rowid,","run","s3,","s3://el
 
asticmapreduce/bootstrap","s3://mybucket/emr/log","s3n://${s3bucket}/emr/log","save","select","set","setup\"","site.xml","site=s3://${s3bucket}/emr/conf/h","size","softwar","sourc","specifi","split","sponsor","spot","store","string,","sum(m.weight","t","t.label","t.rowid,","t.rowid;","t.value)","tabl","task","termin","test","textfil","then,","through","tip","total_weight,","train","train_arow(addbias(features),label)","tsv","type","undergo","uri","us","user","usual","valu","vector","version","view","way","weight","wizard.","work","xmx1536m,","yarn","yarn.","zone"],"tips/general_tips.html":["(asf),","apach","effort","foundat","gener","hive/hadoop","hivemal","incub","incubator.","softwar","sponsor","tip","undergo"],"tips/rowid.html":["${sequence_number}","${task_id}","'","'')","',","()","(asf),","*","..;","a9atest;","ad","also,","anoth","apach","becom","creat","dataset","each","effort","execut","foundat","function","gener","hivemal","however,","incub","incubator.","larg","later.","lon
 
g","option","over","provid","queri","rc.1","reducer.","regexp_replace(reflect('java.util.uuid','randomuuid'),","return","row","row_number()","row_number().","rowid","rowid()","rowid,","rownum()","scheme","select","singl","slow","softwar","sponsor","sprintf(`%d%04d`,sequence,taskid)","sql","string","support","tabl","undergo","uniqu","us","v0.2","v0.5","xxx","xxx;"],"tips/hadoop_tuning.html":["\"","(1","(2^24","(asf),","(assum","(e.g.,","(float)","(heuristics)","(iff","(mr","(short)","(use","(yarn)","*","0.5","0.6)","1.2","1024mb","161mb","2","2048","2048mb","2^24","2^25","2^25)","4","820","820mb","=","abov","amplify()).","apach","avail","byte","calculated)","case.","chang","compon","configur","consum","covari","default)","default.","dens","densemodel\"","effort","engin","estim","execut","feature_dimens","follow","follows:","formula","foundat","guid","hadoop","hash","here","hive","hive.execution.engine=mr;","hive.execution.engine=tez;","hivemal","hivemall.","http://hadoopbook.com/","h
 
ttp://www.slideshare.net/cloudera/mr","import","incub","incubator.","io.sort.mb=1024","larg","make","mapper","mapper.","mapred.job.reduce.input.buffer.percent=0.2","mapred.map.child.java.opts=\"","mapred.reduce.child.java.opts=\"","mapred.reduce.shuffle.input.buffer.percent=0.6","mapreduc","mapreduce.framework.name=yarn","mapreduce.framework.name=yarn;","mapreduce.map.java.opt","mapreduce.map.java.opts=\"","mapreduce.reduce.input.buffer.percent)","mapreduce.reduce.input.buffer.percent=0.2","mapreduce.reduce.java.opt","mapreduce.reduce.java.opts=\"","mapreduce.reduce.shuffle.input.buffer.percent=0.6","mapreduce.task.io.sort.mb","mapreduce.task.io.sort.mb=1024","max","mb","memori","model","model,","model.","moreover,","note:","old","option","perf","plain","pleas","possible.","predict","prerequisit","queries.","rand_amplify()).","recommend","reduc","reducer.","refer","represent","run","set","setting:","side","so,","softwar","spaceefficientdensemodel","spaces.","spars","sponsor","table)
 
","tez","tez;","train","tune","tuning:","undergo","us","used,","v1)","xmx2048m","xx:+printgcdetails\"","≈"],"troubleshooting/":["(asf),","apach","effort","foundat","hivemal","incub","incubator.","softwar","sponsor","troubleshoot","undergo"],"troubleshooting/oom.html":["(a","(asf),","(mapred.child.java.opts/mapred.map.child.java.opts)","amplify(),","apach","befor","caus","certain","cloud","default","due","dure","each","effort","error","exampl","first","fit","foundat","hadoop","happen","hivemal","hivemall.","increases)","incub","incubator.","input","instead.","larg","larger","mapper","mapred.max.split.s","mapred.max.split.size=67108864;","mapred.reduce.task","mapred.reduce.tasks=64;","memory.","merg","middl","model","number","oom","outofmemoryerror","parameters.","possible.","rand_amplify()","reduc","revis","set","setting,","shuffle/merg","shuffle/reduc","size","smaller","softwar","split","sponsor","step,","still","that,","then,","train","trainer","training.","tri","undergo","us","v
 
alu"],"troubleshooting/mapjoin_task_error.html":["(asf),","0.11.0,","apach","auto","befor","complex","convers","default.","disabl","effort","enabl","error:","except","execut","follows.","foundat","gener","hive","hive.auto.convert.join","hive.auto.convert.join=false;","hivemal","incub","incubator.","join","map","object","object.","queri","semanticexcept","semanticexception,","serial","set","softwar","sometim","sponsor","task","throw","undergo","us","views,","workaround"],"troubleshooting/asterisk.html":["(asf),","4181","alia","alias,","apach","argument","asterisk","effort","explicitly.","fix","foundat","hive","hivemal","incub","incubator.","name","part","possibl","release.","see","softwar","specifi","sponsor","tabl","udtf","undergo","us","v0.12","without","work","workaround","working."],"troubleshooting/num_mappers.html":["#","(asf),","(i.e.,","2.x","apach","block","configur","control","default","default.","effort","foundat","give","hadoop","hdfs)","hive.input.format","hive.input.for
 
mat.","hive.input.format=org.apache.hadoop.hive.ql.io.hiveinputformat;","hive.tez.input.format;","hive.tez.input.format=org.apache.hadoop.hive.ql.io.hiveinputformat","hivemal","incub","incubator.","input","less","mapper","mapreduce.job.maps=128;","maximum","note","number","org.apache.hadoop.hive.ql.io.combinehiveinputformat.","org.apache.hadoop.hive.ql.io.hiveinputformat","set","setting:","size","softwar","split","sponsor","table.","tez","tri","undergo","us","via"],"troubleshooting/mapjoin_classcastex.html":["(asf),","1.3.0.","[workaround]","apach","array","caus","caution:","classcastexcept","column(s).","contain","detail.","effort","fix","follows:","foundat","hive","hive.mapjoin.optimized.hasht","hive.mapjoin.optimized.hashtable=false;","hive_11051","hivemal","incub","incubator.","join","map","refer","serial","set","side","softwar","sponsor","tabl","tez","tri","undergo"],"misc/generic_funcs.html":["\"normal\",","(1.0","(asf),","(default),","(or","(æ
 ª)トンドルiii","*)","+","..)
 
","/","0).","0.0f|1.0f","0.0f|1.0f,","1","1,9]","1.0","1|1","2","2);","2,1,3,10]","2,10));","2,4);","3","3);","4","5","6","7","8","9","9223372036854775808]","=",">",">[14,","[","[\"aaa\"]","[\"kuromoji\",\"使う\",\"分かち書き\",\"テスト\",\"第\",\"二\",\"引数\",\"normal\",\"search\",\"extended\",\"指定\",\"デフォルト\",\"normal\",\"","[,","[1,2,3,4]","[1,2,3]","[2,3,4]","[3,4]","[3]","aa+=kaim|wtt!+wbgaa","aaaaaaaaaaaaaaaabbbbccc","aggreg","apach","argument","array","array.","array_avg(array)","array_concat(array","array_concat(array(1),array(2,3));","array_intersect(array","array_intersect(array(1,3,4),array(2,3,4),array(3,5));","array_remove(array","array_remove(array(\"aaa\",\"bbb\"),\"bbb\");","array_remove(array(1,null,3),array(null));","array_sum(array)","articl","b1,","b2,","base91","base91(binary)","base91(deflate('aaaaaaaaaaaaaaaabbbbccc'));","between","binari","bits_collect(int|long","bits_or(array","bitset","bitset)","boolean","cmpkey,","column","comp
 
ress","compresseddata)","compressionlevel])","concaten","const","contain","convert","convert_label(const","data","decompress","deflate(text","deflater.","describ","detail.","doubl","duplic","each","each_top_k(int","effort","element","elimin","end","end)","english","englishtext","exclus","exp(","float)","form","form.","form])","foundat","fromindex","fromindex,","function","functions.","gener","generate_serics.","generate_series(1,9);","generate_series(const","give","given","group,","hivemal","http://www.postgresql.org/docs/current/static/funct","id","inclus","incub","incubator.","index","indexes)","inflat","inflate(binari","inflate(unbase91(base91(deflate('aaaaaaaaaaaaaaaabbbbccc'))));","int","intersect","int|bigint","int|const","int|text","int|text|array","is_stopword(str","k","k,","key","key)","keys)","last","less","level","line","list","logic","long","long[]","map","map_get_sum(map","map_tail_n(map","mapred.task.partit","mapreduc","math","mean","mode","n","n)","natur","nfc","nfd,"
 ,"nfkc,","nfkd","normal","normalize_unicode('㈱㌧㌦â…
²','nfkc');","normalize_unicode('ハンカクカナ
','nfkc');","normalize_unicode(str","number","object","on","order","origin","original,","orignal,","page","postgresql'","process","pseudo","queri","rang","refer","regex])","remov","represent","retriev","return","reverseorder=false])","row","rowid()","select","sequenc","seri","set","sigmoid(x)","similar","slice","softwar","sort","sort_and_uniq_array(array(3,1,1,","sort_and_uniq_array(array)","specifi","split","split_words(str","sponsor","src","src,","srf.html","start","start,","stoptags])","stopword","stopwords,","str","string","subarray(array","subarray(array(1,2,3,4,5,6),","subarray_endwith(array","subarray_endwith(array(1,2,3,4),","subarray_startwith(array","subarray_startwith(array(1,2,3,4),","sum","tail","take","target","target)","taskid()","text","to_bits(array(1,2,3,128));","to_bits(int[]","to_map(key,","to_ordered_map(key,","toindex","toindex)","token","tokenize(str","to
 
kenize_ja(\"kuromojiを使った分かち書きのテストです。第二引数にはnormal/search/extendedを指定できます。デフォルトではnormalモードです。\");","tokenize_ja(str","tolowercase])","top","transform","two","type","udaf","udf","unbase91(string)","unbits(bits_or(to_bits(array(1,4)),to_bits(array(2,3))));","unbits(long[]","unbits(to_bits(array(1,4,2,3)));","undergo","up","us","valu","value)","values,","whether","word","word)","x)","x))","x1,","x2,","x_rank(key)","{sequence_number}","{task_id}","ハンカクカナ","モード\"]"],"misc/topk.html":["${k},","(","(asf),","(e.g.,","(int","(partit","(rank,",")","),","*","..","..,","...,","0","0,","0.2","0.4","0.4383084177970886","0.43862903118133545","0.4398220181465149","0.44030147790908813","0.4408798813819885","0.44112563133239746","0.4415401816368103","0.44166821241378784","0.4422193765640259","0.4424300789833069","0.44254064559936523","0.44283604621887207","0.4429032802581787","0.4432108402252197","0.
 
44323229789733887","0.4435907006263733","0.4442034363746643","0.44569307565689087","0.4460843801498413","0.4464914798736572","0.45163780450820923","0.45244503021240234","0.4525672197341919","0.4527127146720886","0.45314133167266846","0.6","0.8","0.8205751180648804","0.822281539440155","0.8241575956344604","0.8255619406700134","0.8271955251693726","0.8301891088485718","0.8328862190246582","0.8340602517127991","0.8344510793685913","0.8390793800354004","0.8438876867294312","0.8439178466796875","0.8463355302810669","0.8467264771461487","0.8499397039413452","0.8516314029693604","0.8562054634094238","0.856602132320404","0.8585299849510193","0.8594650626182556","0.9480557441711426","0.9493276476860046","0.9531533122062683","0.9536819458007812","0.9761330485343933","1","1,","10","10,","100),","10143","10242","10514","10922","10;","11073","11719","12","14073","15173","17218","17582","17782","18541","18556","19468","2","2,","20400","21009","21115","21125","21595","21657","22006","22853","2315
 
0","23386","24289","24413","25","2513","25141","25364","25977","26220","27121","3","34","3786","4","5","50","6","60","6598","7","70","7041","7326","7503","8","80","8018","8477","8697","9","90","900","9008","943","9881","=","`each_top_k`","accept","addit","altern","alway","amount","angular_similarity(features1,","angular_similarity(t2.features,","apach","appli","arg1,","arg2,","argn)","argn).","argn.","argument","asc,","assum","avoid","b","base_id","base_id,","benef","by)","cases.","caution","cautioneach_top_k","certain","class","class,","claus","click","clicks,","cluster","column","compar","comparison.","complex","comput","consid","consist","creat","cross","crucial","data.","dense_rank","desc)","desc;","differ","distribut","doubl","each","each_top_k","each_top_k(","each_top_k(${k},","each_top_k(int","each_top_k.","effici","efficiently.","effort","ensur","environ","explicit","extens","fast","featur","features1,","features2),","features2,","follow","follows:","foundat","function","get
 
","group","group,","group.","hanld","help","hive","hive.","hivemal","hivevar:k=","hivevar:k=10;","hivevar:k=5;","http://stackoverflow.com/questions/9390698/h","id","id)","id,","id1","id1,","id2,","if(valu","incub","incubator.","input","instead.","interact","involv","item","join","k","k,","k.","key","larg","large.","later.","left","length","less","limit","list","mandatori","mani","massiv","method","mytabl","n","neighbor_id","neighbor_id,","note","noteclust","null","null,","null.","number","o(nm).","or,","order","other_id,","outer","output","over","page","parallel","particularli","process","pseudo","queri","query/32559050#32559050","rand(31)","rank","rank()","rank,","rank/distribut","record","relat","requir","result","return","revers","rnd","rnd,","run","s01","s02","s03","s04","s05","s05;","scheme","score","score,","select","semant","set","signatur","similar","similarity,","similarity/dist","slightli","softwar","sort","sponsor","sql","sql'","standard","student","student)","student,","
 
support","suppos","synonym","t","t01","t02","t03","t04","t05","t1","t1.featur","t1.features),","t1.i","t1.id","t1.id,","t1;","t2","t2.featur","t2.id","t2.id,","t;","tabl","tail","take","test_hivemal","test_rnd","that.","then,","third","timestamp","top","train_hivemal","type","udtf","undergo","union","us","usag","user","v0.3.2","valu","value)","value,","value.","variabl","veri","way","whre","window","x","y","y)"],"misc/tokenizer.html":["\"normal\",","(asf),","/tmp/defin","/tmp/hivemal","=","[\"kuromoji\",\"使う\",\"分かち書き\",\"テスト\",\"第\",\"二\",\"引数\",\"normal\",\"search\",\"extended\",\"指定\",\"デフォルト\",\"normal\",\"モード\"]","add","additional.hive;","all,","apach","apis,","array","basic","boolean","caution:","const","ddl","dependencies.jar.","dependencies.jar;","detail","effort","english","english/japanes","false)","first","follow","follows:","foundat","hivemal","includ","incub","incubator.","input,","issu","it'","japanes","japaneseanalyz","j
 
ar","javadoc","kuromoji.","later.","mode","modul","module.","need","nlp","note","option","pleas","provid","refer","select","signatur","simpl","softwar","sourc","sponsor","stoptags)","stopwords,","support","syntax:","text","token","tokenize(text","tokenize_ja","tokenize_ja(\"kuromojiを使った分かち書きのテストです。第二引数にはnormal/search/extendedを指定できます。デフォルトではnormalモードです。\");","tokenize_ja(text","tolowercas","udf","undergo","us","usag","v0.4.1","well.","xxx"],"ft_engineering/scaling.html":["\":\",","\"age\"","\"balance\"","\"campaign\"","\"day\"","\"duration\"","\"pdays\"","\"previous\"","${max_target})","${mean_target},","${min_target},","${stddev_target})","(","(asf),","(t1.featur",")","),","...","0,","0.51940954","0.51940954;","0.6278076335455348","1","1,","2","3","3.566241460963296","3.566241460963296;","3;","7.899578","7.899578;",";","=","[\"reflectance:0.5252967\",\"specific_heat:0.19863537\",\"weight:0.0\"]","[
 
\"reflectance:0.5950446\",\"specific_heat:0.09166764\",\"weight:0.052084323\"]","[\"reflectance:0.6797837\",\"specific_heat:0.12567581\",\"weight:0.13255163\"]","[\"weight:69.613\",\"specific_heat:129.07\",\"reflectance:52.111\"]","[\"weight:70.67\",\"specific_heat:128.161\",\"reflectance:52.446\"]","[\"weight:72.303\",\"specific_heat:128.45\",\"reflectance:52.853\"]","ag","apach","appli","avg(target),","avg(value)","balanc","befor","both","campaign","collect_list(","collect_list(feature)","complex","concat(feature,","creat","data.","day","durat","e2006tfidf_test","e2006tfidf_train","e2006tfidf_train;","e2006tfidf_train_sc","effort","explod","explode(features)","extract_feature(feature)","extract_weight(feature)","fals","featur","feature(","feature(feature,","feature,","follow","follows:","foundat","fv","group","hivemal","hivevar:max_target=","hivevar:mean_target=","hivevar:min_target=","hivevar:stddev_target=0.6278076335455348;","http://en.wikipedia.org/wiki/feature_scaling#resc",";
 
http://en.wikipedia.org/wiki/standard_scor","id,","if(pday","if(t1.minmax,rescale(t1.value,","incub","incubator.","join","later","limit","max","max(target)","max(value)","mean,","min","min(target),","min(value)","min,","minmax","minmax)","minmax,","more","norm","norm_fv","normal","pdays)","previou","quant","quantative_norm","quantative_stat","replac","rescale(t1.value,","rescale(target,","rowid","rowid,","scale","select","set","softwar","sponsor","stat","stddev","stddev,","stddev_pop(target)","stddev_pop(value)","t1","t1.feature,","t1.id","t1.id,","t2","t2.feature)","t2.max)","t2.max),zscore(t1.value,","t2.mean,","t2.min,","t2.stddev)","t2.stddev))","t;","tabl","target","target,","tip","train","train_norm","true","undergo","union","us","v0.3.2","valu","vector","view","zscore","zscore(t1.value,","zscore(target,","zscore)"],"ft_engineering/hashing.html":["\"movieid#2331\"));","(2^24).","(2^24)]","(a.k.a.","(asf),","(it'","(or","+1'd","0","1","1.","10');","16777216","16777217","2","274
 
6618","2;","3');","3874068","4063537","9566153","[","[\"11293631\",\"3322224\",\"4331412\"]","[\"11293631:0.1\",\"3322224:0.2\",\"4331412:0.3\"]","[\"1803454\",\"6630176\"]","[\"1828616\",\"6238429\"]","[\"1828616:3.3\",\"6238429:4.999\",\"6238429\"]","[\"4063537\",\"8459207\"]","[\"4063537:1.0\",\"4063537\",\"8459207:2.0\"]","[\"7\",\"1\"]","[\"userid#4505\",\"movieid#2331\"]","[\"userid#5689\",\"movieid#3072\"]","[,","[default:","]","alway","apach","appli","array","bia","clause.","consid","const","control","default","describ","differ","effort","element","examples.","extend","featur","feature_hash","feature_hashing('aaa');","feature_hashing('aaa','","feature_hashing(array","feature_hashing(array(\"userid#4505:3.3\",\"movieid#2331:4.999\",","feature_hashing(array('1','2','3'));","feature_hashing(array('1:0.1','2:0.2','3:0.3'));","feature_hashing(array('aaa','bbb'));","feature_hashing(array('aaa','bbb'),'","feature_hashing(array('aaa:1.0','aaa','bbb:2.0'));","feature_hashing(array(1,
 
2,3));","feature_hashing(features),","feature_hashing(null,'","features)","features,","features.","find","follow","foundat","function","functions.","hash","help","help');","help]","hivemal","hivevar:num_features=16777216;","hivevar:num_features=1;","incub","incubator.","int","limit","mhash","mhash('aaa');","mhash('aaa',${num_features});","mhash('aaa:2.0');","mhash(array('aaa','bbb'));","mhash(array('bbb','aaa'));","mhash(str","mhash;","murmurhash3","never","note:","noteth","num_featur","number","number).","option.","options])","order","reserv","return","scalar","select","sentitive.","set","show","softwar","sponsor","start","string","support","system","through","training_fm","trick)","undergo","usage:","valu","value.","values.","vector","word)"],"ft_engineering/selection.html":["#features)","${k})","(","(#classes,","(1,","(\\sigma_{1}","(asf),","(chi2)","(n_class,","(n_classes,","(snr)","(x.#cols,",")","),",");","+","/","1)","2)","3)","=","[udaf]","[udf]","\\mu_{2}|","\\sigma_{2})∣
 
μ​1​​−μ​2​​∣/(σ​1​​+σ​2​​),","aggreg","algorithm","apach","appli","array","array)","array,","array>","array>,","array_avg(y)","array_sum(x)","articl","base","best","between","binar","binari","both","chi","chi2","chi2(observed::array>,","chi2(r.observed,","class","class_prob","classif","classification.","clearly,","col","construction.","creat","criterion","cross","defin","details.","deviat","dot","dot(class_prob.t,","dot(x.t,","each","effort","element","even","events.","expect","expected::array>)::struct,","featur","feature_count)","feature_count,","features,","foundat","function","hivemal","hivevar:k=2;","hot","import","importance_list","importance_list::array,","improv","incub","incubator.","independ","input","int","join","k","k::int)::array","kkk,","kkk.","know","l","l.expected)","label","larger","later.","list","mathemat","matrix","mean","metric,","model","n_class","n_featur","n_features)","nois","note:","number","observ","observed,","omit","on","o
 
utput","p","predict","prediction.","problems.","process","product","r","r.v.chi2,","r;","rank","ratio","rc.1","redund","refer","relev","result","row","score","select","select_k_best(l.x,","select_k_best(x,","select_k_best(x::array,","selection.","set","shape","shorten","signal","signatur","snr","snr(x,","snr(x::array,","snr,","snr;","softwar","sponsor","squar","standard","stat","statist","statistics,","struct,","subset","support","tabl","target","techniqu","test","time,","top","train","transpose_and_dot(class_prob,","transpose_and_dot(x::array,","transpose_and_dot(y,","two","undergo","univari","us","usag","v","v0.5","valu","variabl","vector","vector,","x","x)","y","y)","y.#cols)","y::array)::array","y::array)::array>","μk\\mu_{k}μ​k​​","σk\\sigma_{k}σ​k​​","χ2\\chi^2χ​2​​","∣μ1−μ2∣/(σ1+σ2)|\\mu_{1}"],"ft_engineering/binning.html":["'female'),","'female');","'gender'),","'male'),","(","('emma',","('ethan',","('isabella',","('jacob',","('mason',","('n
 
oah',","('sophia',","(asf),","(bin","(user",")","),",");","0","1","15","15,","2","20","20,","22","22,","3)","3))","35","35,","46","46,","55","55,","=","[\"name#emma\",\"gender#female\",\"age:0\"]","[\"name#ethan\",\"gender#male\",\"age:2\"]","[\"name#isabella\",\"gender#female\",\"age:1\"]","[\"name#jacob\",\"gender#male\",\"age:1\"]","[\"name#mason\",\"gender#male\",\"age:1\"]","[\"name#noah\",\"gender#male\",\"age:2\"]","[\"name#sophia\",\"gender#female\",\"age:2\"]","[auto_shrink:","[udaf]","[udf]","a.","ag","age,","age:int","apach","appli","array","array('age'),","array('name',","array_concat(","auto_shrink","auto_shrink])","b","b.","behavior","bin","bin:","bins.","bins;","boolean","build_bins(age,","build_bins(weight,","categor","categorical_features(","col","creat","cross","data","data.","defin","divid","duplic","effort","entry::","exception.","f=>except","false]","featur","feature_binning(age,","feature_binning(features,","features:","few","first","follows:","foundat","functi
 
on","gender","group","hivemal","id)","incub","incubator.","input","insert","int","int,","int|bigint|float|doubl","join","key:","later.","mani","map","map('age',","map>","method","name","name,","not,","note:","notether","num_of_bin","num_of_bins:","num_of_bins[,","number","output","possibl","pre","prepar","quantil","quantiles)","quantiles.","quantiles:","quantiles_map","quantiles_map)","quantiles_map)/(weight,","quantiles_map:","quantit","quantitative_features(","rc.1","repeat","repeated:","result","sampl","select","separ","serial","signatur","skip","softwar","sponsor","string","string,","support","t","t=>skip,","tabl","table)","throw","trasform","true,","undergo","usag","user","v0.5","val:","valu","values.","variabl","variation:","vector","weight","weight:"],"ft_engineering/pairing.html":["(asf),","apach","effort","featur","foundat","hivemal","incub","incubator.","pair","softwar","sponsor","undergo"],"ft_engineering/polynomial.html":["\"c:0.3\"),","(asf),",")","+","2);","3);","3,","
 >","[\"a:0.5\",\"a^2:0.25\",\"a^3:0.125\",\"b:0.2\",\"b^2:0.040000003\",\"b^3:0.008\"]","[\"a:0.5\",\"a^a:0.25\",\"a^a^a:0.125\",\"a^a^b:0.05\",\"a^b:0.1\",\"a^b^b:0.020000001\",\"b:0.2\",\"b^b:0.040000003\",\"b^b^b:0.008\"]","[\"a:0.5\",\"a^a:0.25\",\"a^a^a:0.125\",\"a^a^b:0.25\",\"a^a^c:0.075\",\"a^b:0.5\",\"a^b^b:0.5\",\"a^b^c:0.15\",\"a^c:0.15\",\"a^c^c:0.045\",\"b:1.0\",\"b^b:1.0\",\"b^b^b:1.0\",\"b^b^c:0.3\",\"b^c:0.3\",\"b^c^c:0.09\",\"c:0.3\",\"c^c:0.09\",\"c^c^c:0.027000003\"]","[\"a:0.5\",\"a^a:0.25\",\"a^a^a:0.125\",\"a^a^c:0.075\",\"a^c:0.15\",\"a^c^c:0.045\",\"b:1.0\",\"c:0.3\",\"c^c:0.09\",\"c^c^c:0.027000003\"]","[\"a:0.5\",\"a^a:0.25\",\"a^b:0.1\",\"b:0.2\",\"b^b:0.040000003\"]","[\"a:0.5\",\"a^b:0.1\",\"a^b^c:0.030000001\",\"a^c:0.15\",\"b:0.2\",\"b^c:0.060000002\",\"c:0.3\"]","[\"a:0.5\",\"a^b:0.1\",\"b:0.2\"]","[\"a:0.5\",\"a^b:0.5\",\"a^b^c:0.15\",\"a^c:0.15\",\"b:1.0\",\"b^c:0.3\",\"c:0.3\"]","[\"a:0.5\",\"a^c:0.15\",\"b:1.0\",\"c:0.3\"]","[,","allow","apach","a
 
ssum","becom","boolean","cautionpolynomi","combinations.","degre","easili","effort","elimin","false);","false,","featur","features,","features.","foundat","function","gener","hivemal","incub","incubator.","inf","inf/","input","int","interact","interactiononly=false,","large.","learn,","linear","model.","n","non","normal","note:","on","polynomi","polynomial_feature(array","polynomial_features(array(\"a:0.5\",\"b:0.2\"),","polynomial_features(array(\"a:0.5\",\"b:0.2\",\"c:0.3\"),","polynomial_features(array(\"a:0.5\",\"b:1.0\",","polynomial_features(array(\"a:0.5\",\"b:1.0\",\"c:0.3\"),","power","powered_features(array","powered_features(array(\"a:0.5\",\"b:0.2\"),","regression/classif","scikit","select","similar","softwar","sponsor","true);","true,","truncat","truncate=true]","truncate=true])","undergo","unnecessari","us","x**n"],"ft_engineering/ft_trans.html":["(asf),","apach","effort","featur","foundat","hivemal","incub","incubator.","softwar","sponsor","transform","undergo"],"ft_e
 
ngineering/vectorization.html":["(a","(asf),",")","*","...)","1","1.0","1.0\",\"poutcome#unknown\"]","2","2;",">",">[\"a:0.2\",\"b:0.3\"]","[\"a:0.2\",\"b:0.3\",\"bool:1.0\"]","[\"a:0.2\",\"b:0.3\",\"whether#sunny\"]","[\"a:0.2\"]","[\"a:1.0\"]","[\"age:39.0\",\"job#blu","[\"age:51.0\",\"job#entrepreneur\",\"marital#married\",\"education#primary\",\"default#no\",\"balance:1443.0\",\"housing#no\",\"loan#no\",\"contact#cellular\",\"day:18.0\",\"month#feb\",\"duration:172.0\",\"campaign:10.0\",\"pdays:","age,job,marital,education,default,balance,housing,loan,contact,day,month,duration,campaign,pdays,previous,poutcom","apach","array","array(\"age\",\"job\",\"marital\",\"education\",\"default\",\"balance\",\"housing\",\"loan\",\"contact\",\"day\",\"month\",\"duration\",\"campaign\",\"pdays\",\"previous\",\"poutcome\"),","avoid","boolean","categor","collar\",\"marital#married\",\"education#secondary\",\"default#no\",\"balance:1756.0\",\"housing#yes\",\"loan#no\",\"contact#cellular\",\"day
 
:3.0\",\"month#apr\",\"duration:939.0\",\"campaign:1.0\",\"pdays:","column","dual;","each","effort","exampl","featur","featurenames,","features,","foundat","gener","hivemal","id,","incub","incubator.","limit","name)","row,","select","softwar","sponsor","tabl","table.","train","treat","true","undergo","us","valu","vector","vectorize_feature(array","vectorize_features(","vectorize_features(array(\"a\"),*)","vectorize_features(array(\"a\",\"b\"),\"0.2\",\"0.3\")","vectorize_features(array(\"a\",\"b\"),\"0.2\",0)","vectorize_features(array(\"a\",\"b\",\"bool\"),0.2,0.3,true)","vectorize_features(array(\"a\",\"b\",\"wheather\"),\"0.2\",\"0.3\",\"sunny\")","w/","weight","y","zero"],"ft_engineering/quantify.html":["${output_row},","(","(asf),","(id,",")","*","*)","0","1","1,0,pdays),","10","102","1028","1029","10;","121","1294","13","14","140","1443","1466","150","16","172","1756","176","18","181","1815","185","2","20","230","235","24","25","26","260","266","27","29","295","3","30","31","3
 
2","324","34","354","36","37","38","39","4","404","41","423","426","43","436","442","474","476","476,0,0,1,27,5,92,4,0,0,0]","486","5","502","51","52","54","567","572","572,0,1,1,5,3,26,24,0,0,0]","574","595","6","62","6217","63","7","707","8","895","9","908","92","939","[1.0,39.0,0.0,0.0,0.0,0.0,1756.0,0.0,0.0,0.0,3.0,0.0,939.0,1.0,0.0,0.0,0.0,1.0]","[10.0,32.0,7.0,1.0,2.0,0.0,1815.0,1.0,0.0,2.0,10.0,6.0,235.0,1.0,6.0,2.0,1.0,1.0]","[2.0,51.0,1.0,0.0,1.0,0.0,1443.0,1.0,0.0,0.0,18.0,1.0,172.0,10.0,0.0,0.0,0.0,1.0]","[3.0,36.0,2.0,1.0,2.0,0.0,436.0,1.0,0.0,0.0,13.0,0.0,567.0,1.0,1.0,2.0,1.0,1.0]","[30,2,1,2,0,1028,1,0,0,4,1,1294,2,0,0,0]","[32,2,0,0,0,6217,0,1,0,18,9,486,2,181,2,1]","[34,5,1,0,0,","[37,1,0,1,0,62,1,0,0,31,8,404,2,0,0,0]","[38,5,1,2,0,","[39,7,1,2,0,426,1,0,1,18,3,1029,1,0,0,0]","[4.0,63.0,3.0,0.0,0.0,0.0,474.0,1.0,0.0,0.0,25.0,2.0,423.0,1.0,0.0,0.0,0.0,1.0]","[41,0,0,0,0,121,0,0,0,13,5,16,6,176,5,3]","[43,4,0,1,0,574,0,0,0,8,5,140,1,0,0,0]","[5.0,31.0,2.0,1.0,2.0,0.0
 
,354.0,1.0,0.0,0.0,30.0,0.0,502.0,1.0,2.0,2.0,2.0,1.0]","[52,8,0,1,0,1466,1,1,0,20,9,150,1,0,0,0]","[54,5,0,0,0,324,0,0,2,13,5,51,1,0,0,0]","[6.0,29.0,0.0,1.0,0.0,0.0,260.0,0.0,0.0,1.0,2.0,3.0,707.0,14.0,0.0,0.0,0.0,1.0]","[7.0,37.0,4.0,0.0,0.0,0.0,52.0,0.0,0.0,0.0,6.0,4.0,908.0,1.0,3.0,9.0,2.0,1.0]","[8.0,32.0,5.0,1.0,0.0,0.0,230.0,0.0,0.0,0.0,18.0,5.0,442.0,1.0,4.0,8.0,1.0,1.0]","[9.0,31.0,6.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,7.0,5.0,895.0,2.0,5.0,2.0,1.0,1.0]","admin.","ag","age,","apach","apr","array(age,","asc","aug","balanc","balance,","blue","campaign","campaign,","cast(pday","cellular","collar","column","contact","contact,","dataset","day","day,","default","default,","desc","durat","duration,","educ","education,","effort","employ","entrepreneur","failur","fals","featur","feb","forc","foundat","hivemal","hivevar:output_row=true;","hous","housemaid","housing,","id","id,","if(pdays==","incub","incubator.","index","int","jan","job","job,","jul","jun","later.","limit","loan","loan,","
 
manag","marit","marital,","marri","month","month,","non","note:","nov","number","numbers.","order","output_row,","pday","pdays,","poutcom","poutcome)","poutcome,","previou","previous,","primari","quantifi","quantified_featur","quantified_features(","quantify(","quantify(${output_row},","quantify()","reduc","retir","run","secondari","select","self","sep","servic","set","singl","softwar","sponsor","string","string),","success","support","t","t0","t1","t2","technician","telephon","tertiari","test","train","train;","train_first,","transform","true","undergo","union","unknown","us","v0.4","valu","y","y)","ye"],"ft_engineering/tfidf.html":["\":\",","\"realm:0.03282491756638329\",\"divided:0.03282491756638329\",\"concepts:0.03282491756638329\",\"attainment:0.032824","${n_docs})","&","'/home/myui/tmp/tfidf_test.tsv'","'|'","(","(asf),","(docid,","(docid,word)","(log(10,","(tf.word",")","*","+","...",".04200326112968063\",\"judgement:0.035169554338885474\",\"apply:0.035169554338885474\",\"di
 
sposition:0.035169554338","0.014001086678120098","0.017584777169442737","0.03282491756638329\",\"moral:0.03282491756638329\",\"numerous:0.03282491756638329\",\"philosophical:0.032824917566","0.06564983513276658","0.07033910867777095","0.09484606645205085","0.12","0.13","0.1641245850805637","1","1,","1.0)","1.0);","2","2,","3","38329\",\"application:0.03282491756638329\",\"perspectives:0.03282491756638329\",\"procedural:0.03282491756638329\",","56638329\",\"equity:0.03282491756638329\",\"includes:0.03282491756638329\",\"theology:0.03282491756638329\",\"ethics:","64983513276658\",\"based:0.06564983513276658\",\"religion:0.06564983513276658\",\"viewpoints:0.03282491756638329\",\"","82491756638329\",\"rightness:0.03282491756638329\",\"general:0.03282491756638329\",\"many:0.03282491756638329\",\"dif","885474\",\"given:0.035169554338885474\"","91756638329\",\"fields:0.03282491756638329\",\"often:0.026135361945200226\",\"philosophy:0.026135361945200226\",\"stu","=","[\"action:0.07033910867
 
777095\",\"wisdom:0.05275433288400458\",\"one:0.05275433288400458\",\"understanding:0","[\"justice:0.1641245850805637\",\"found:0.06564983513276658\",\"discussion:0.06564983513276658\",\"law:0.065","abov","act","action","apach","appropri","befor","beta3","calcul","cast(${n_docs}","cast(n_doc","cd","collect_all(concat(word,","collect_list(concat(word,","collect_list(feature(word,","compos","comput","consid","consist","count(distinct","creat","data","defin","delimit","desc;","df","df.docs,","df.word)","df_t","discuss","doc","docid","docid)","docid,","docid/word","docid;","document","document_frequ","download","dy:0.026135361945200226\"]","each","effort","entri","experi","explain","explode(tokenize(page,true))","explode(word2freq)","extern","featur","fering:0.03282491756638329\",\"fairness:0.03282491756638329\",\"social:0.03282491756638329\",\"broadest:0.032824917","field","find","float)/max2(1,df.docs))","float)/max2(1,df_t))","float,","follows:","format","found","foundat","freq","fre
 
q;","group","hive","hive/hivemall.","hivemal","hivevar:n_docs=3;","https://gist.githubusercontent.com/myui/190b91a3a792ccfceda0/raw/327acd192da4f96da8276dcdff01b19947a4373c/tfidf_test.tsv","idf","idf(df_t","idf,","if(x>y,x,y);","incub","incubator.","inpath","int)","int,","is_stopword(word);","join","justic","justice,","knowledg","knowledge,","later","later.","law","link.","load","local","macro","max2(x","n_doc","need","note","number","order","page","pair","pair,","prepar","query.","rationality:0.03282491756638329\",\"including:0.03282491756638329\",\"context:0.03282491756638329\",\"concept:0.032","relat","religion","replac","respectively.","result","row","select","set","softwar","sponsor","store","string","support","t","t2","tabl","table/view","temporari","term_frequ","termin","textfile;","tf","tf(word)","tf.docid,","tf.freq","tf.word,","tf/df","tfidf","tfidf(tf","tfidf(tf.freq,","tfidf))","total","tuples.","undergo","us","v0.3","v0.3.4","valu","vector","view","views,","virtu","well
 
","wget","wikipag","wikipage;","wikipage_explod","wikipedia","willing","wisdom,","word","word)","word,","word2freq","word;","y","~/tmp"],"eval/stat_eval.html":["${mean_actual},2.0))","(","(asf),","(r^2)",")","/","0","0.01","0.02","0.14852283792484033","0.2466732002711477","0.38538660838804495","0.48623913673053565","1","1.9610366706408238","3.8200363760415414","3.8200363760415414;","3.9124877451612488","absolut","actual)","actual))/count(1)","actual)*ln(1","actual,","actual,2.0))/count(1)","actual,2.0))/count(1))","alpha.5","apach","avg(actual),","avg(predicted)","coeffici","comput","determin","e2006","e2006tfidf_pa2a_submit;","effort","error","evalu","example,","explain","follows:","foundat","hive.","hivemal","hivevar:mean_actual=","http://en.wikipedia.org/wiki/coefficient_of_determin","https://www.kaggle.com/wiki/metr","incub","incubator.","logarithm","logloss(predicted,","logloss1,","logloss2","loss","mae(predicted,","mae,","mean","metric","model","mse(predicted,","mse,","predict
 
","predicted)","predicted))/count(1)","predicted,2.0))","r2","r2(actual,","rc.1","refer","regress","rmse(predicted,","rmse,","root","score","select","set","softwar","sponsor","sqrt(sum(pow(predict","squar","statist","sum(abs(predict","sum(actual*ln(predicted)+(1","sum(pow(actu","sum(pow(predict","support","t","t;","tfidf","undergo","union","us","v0.4.1","v0.4.2"],"eval/auc.html":["(","(asf),","(auc)","(i.e.,","(label=0)","(label=1)","(rows)",")","/","0","0.2","0.2)","0.3","0.5","0.54001","0.7","0.8","0.83333","1","1]","5","[0,","abov","above,","above:","allow","anoth","apach","approxim","area","assum","auc","auc(doubl","auc(prob,","auc.","base","better.","between","bin","binari","both","call","case.","classif","classifi","classification.","claus","column","compar","comput","contain","curv","data","desc","descend","differ","distribut","effort","evalu","example,","floor(prob","follow","follows:","foundat","function","gener","give","hand,","henc","higher","hive'","hivemal","hivemall,",
 
"incub","incubator.","input","instance,","int","label","label)","label.","labels.","large,","larger","logarithm","logist","logloss(prob,","loss","mani","mean","meanwhile,","mention","metric","need","neg","negative)","node","note","now","on","onc","one.","order","order,","order.","pair","pairs.","parallel","parallel:","perform","posit","positive/neg","predict","prob","prob,","probabilities)","probability(predict","probability.","probabl","problem","produc","provid","queri","range.","rank","regression.","rel","respect","return","roc","row","rows,","sampl","samples.","score","score)","score,","select","sequenti","shown","simpli","singl","smaller","softwar","sort","sponsor","such","t;","tabl","truth","ultimately,","under","undergo","union","us","way","well.","wide"],"eval/rank.html":["&","(","(1","(2^{\\mathrm{rel}_n}","(\\mathrm{otherwise})","(asf),","(auc)","(i+,i−)(i^+,","(i_n","(itemid","(map)","(max_k)","(mrr)","(n","(ndcg)","(precision@k)","(recall@k)","(scores)","(t1.userid","(
 
the","(userid",")",")(i​+​​,i​−​​)","),","+",",",".","...,","/","0","0.3333333333333333","0.333recall@2=1/3≈0.333.","0.5","0.5555555555555555","0.5precision@2=1/2=0.5","0.6131471927654585","0.613ndcg​2​​=dcg​2​​/idcg​2​​≈0.613.","0.6666666666666666","0.7039180890341349","0.75","0.8128912838590544","0.9187707805346093","1","1)","1,","1.0","1.631idcg​2​​=1/log​2​​2+1/log​2​​3≈1.631.","1/1","1/\\log_2","10.0","1dcg​2​​=1/log​2​​2=1.","1mrr=1/1=1,","1}^{|\\mathcal{i}|}","2","2)","2),","2,","2.0","3","3)","3,","3.0","3\\}i​2​​(u)={1,3}","3\\}u={1,2,3},","4","4)","4,","4.0","4\\}i​u​+​​={1,2,4},","4\\}i​u​+​​={1,2,4}.","5,","5.0","5\\})","6","6,","6.0","6\\}i={1,2,3,4,5,6}","8.0",";","=","=>",">","[","[1,2,4]","[1,3,2,6],","\\\\","\\approx","\\begin{array}{ll}","\\cap","\\cdot","\\end{array}","\\frac{1}{n_{\\mathrm{tp}}}.","\\frac{1}{|\\mathcal{i}^+_u|}","\\frac{2}{3}","\\frac{3}{4}}{3}","\\frac{3}{5
 
}}{3}","\\frac{\\frac{1}{1}","\\frac{\\mathrm{dcg}_k}{\\mathrm{idcg}_k}","\\frac{\\sum_{n=1}^{|\\mathcal{i}|}","\\frac{|\\mathcal{i}^+_u","\\in","\\left[","\\left[i_n","\\left\\{","\\leq","\\log_2(n","\\mathbf{0.756},","\\mathbf{0.806}.","\\mathcal{i}^","\\mathcal{i}^+_u","\\mathcal{i}^+_u)","\\mathcal{i}^+_u\\right]}{\\sum_{n=1}^{|\\mathcal{i}|}","\\mathcal{i}^+_ui​+​​∈i​u​+​​","\\mathcal{i}i​k​​(u)⊂i,","\\mathcal{u}u∈u,","\\mathrm{dcg}_2","\\mathrm{idcg}_2","\\mathrm{map}","\\mathrm{map}(\\mathcal{i}^+_u,","\\mathrm{mrr}","\\mathrm{ndcg}_k","\\mathrm{precision@}k","\\mathrm{precision@}n","\\mathrm{recall@}k","\\mathrm{rel}_n","\\right.","\\right]n​tp​​∈[1,∣i∣],","\\subset","\\sum_{n","\\time","\\{1,","].","_ui​−​​∈i​u​−​​,","_u|∣i​u​+​​∣×∣i​u​−​​∣","abov","above,","above.","accord","accuraci","addit","addition","additionally,","allow","apach","applic","area","argument:","as:","assess","assign","as
 
sum","auc","auc(t1.rec,","auc,","auc_at_2,","averag","average_precision(t1.rec,","average_precision,","average_precision_at_2,","base","basically,","be","be:","before.","behind","best","better","between","binari","built","by:","case","cast(count(itemid)","chapter,","choic","chosen","classif","collabor","collect_set(itemid)","combin","compar","complet","comput","concept","consid","consist","contain","context","convincing,","correct","correspond","cover","coverag","cumul","curv","d_k(n)","d_k(n)},","dcg2=1/log22=1\\mathrm{dcg}_2","dcgk\\mathrm{dcg}_kdcg​k​​","demonstr","denot","depict","describ","determin","differ","directli","discount","dk(n)={(2reln−1)/log2(n+1)(1≤n≤k)0(n>k).","done","dummi","dummy_rec","dummy_rec?","dummy_recrel","dummy_truth","d​k​​(n)={​(2​rel​n​​​​−1)/log​2​​(n+1)​0​​​(1≤n≤k)​(n>k)​​.","each","easi","effici","effort","emphasi","empty.","enabl","equation:","evalu","even","exactli","example,","exist","expec
 
t","figur","filter","final","first","fit","fix","focus","follow","follows:","formul","formulation,","foundat","function","gain","gener","give","grade","group","handl","hence,","here","here,","higher","highest","hivemal","hivemall'","hivemall.","however,","i(u)i(u)i(u)","i(u)i(u)i(u)),","i(u)i(u)i(u),","i+i^+i​+​​","i+∈iu+i^+","i2(u)={1,3}i_2(u)","i2(u)i_2(u)i​2​​(u)","i={1,2,3,4,5,6}\\mathcal{i}","i\\mathcal{i}i,","i^","i_k(u)|}{|\\mathcal{i}^+_u|}.","i_k(u)|}{|i_k(u)|}.","i_k(u)|∣i​u​+​​∩i​k​​(u)∣","i_n","idcg2=1/log22+1/log23≈1.631\\mathrm{idcg}_2","idcgk\\mathrm{idcg}_kidcg​k​​","ik(u)i_k(u)i​k​​(u)","ik(u)i_k(u)i​k​​(u),","ik(u)⊂ii_k(u)","implement","importantly,","incorpor","incub","incubator.","indic","inform","ini_ni​n​​","input","int)","interest","intern","interpret","introduc","inverse:","is,","item","itemid","itemid),","itemid,","items,","items.","items:","iu+={1,2,4}\\mathcal{i}^+_u","iu+\\mathcal{i}^+_ui​uâ€
 
‹+​​","iu+\\mathcal{i}^+_ui​u​+​​.","iu+\\mathcal{i}^+_ui​u​+​​;","i​−​​.","i−i^","i−∈iu−i^","join","k","k)","label","launch","lead","learn","length","list","list,","lists.","machin","map","map(iu+,{1,3,2,4,6,5})=11+23+343≈0.806.","map(iu+,{1,3,2,6,4,5})=11+23+353≈0.756,","map(i​u​+​​,{1,3,2,4,6,5})=​3​​​1​​1​​+​3​​2​​+​4​​3​​​​≈0.806.","map(i​u​+​​,{1,3,2,6,4,5})=​3​​​1​​1​​+​3​​2​​+​5​​3​​​​≈0.756,","map.","map=1∣iu+∣∑n=1∣i∣precision@nâ‹
…
[in∈iu+].","map=​∣i​u​+​​∣​​1​​​n=1​∑​∣i∣​​precision@nâ‹
…
[i​n​​∈i​u​+​​].","map_keys(to_ordered_map(relscore,","map_valu","map_values(to_ordered_map(score,","match","max_k","mean","meanwhile,","measur","measure,","measures,","metric","metric.","more","mpr","mrr","mrr(t1.rec,","mrr,","mrr=1/1=1\\mathrm{mrr}","mrr=1ntp.","mrr=​n​tp​​​​
 
1​​.","mrr_at_2,","much","multipl","n","name","ndcg","ndcg()","ndcg(t1.rec,","ndcg,","ndcg2=dcg2/idcg2≈0.613\\mathrm{ndcg}_2","ndcg_at_2","ndcgk=dcgkidcgk=∑n=1∣i∣dk(n)[in∈iu+]∑n=1∣i∣dk(n),","ndcg​k​​=​idcg​k​​​​dcg​k​​​​=​∑​n=1​∣i∣​​d​k​​(n)​​∑​n=1​∣i∣​​d​k​​(n)[i​n​​∈i​u​+​​]​​,","nnn","non","normal","notation.","notic","now,","ntp∈[1,∣i∣]n_{\\mathrm{tp}}","number","observations.","obtain","order","origin","out","output","over","page","pair","pairs.","pairs:","permutation,","place","portion","posit","positive,","positives.","possibl","practic","precis","precise,","precision(t1.rec,","precision,","precision@1,","precision@2,","precision@2=1/2=0.5\\mathrm{precision@}2","precision@k","precision@k=​∣i​k​​(u)∣​​∣i​u​+​​∩i​k​​(u)∣​​.","precision@k=∣iu+∩ik(u)∣∣ik(u)∣.","precision@∣i∣|\\mathcal{i}|∣i∣,","precision_
 
at_2,","prediction:","problem","problem,","problem.","problems.","process","provid","quantit","queri","query:","rank","reason","rec","rec,","recal","recall(t1.rec,","recall,","recall@2=1/3≈0.333\\mathrm{recall@}2","recall@k","recall@k,","recall@k=​∣i​u​+​​∣​​∣i​u​+​​∩i​k​​(u)∣​​.","recall@k=∣iu+∩ik(u)∣∣iu+∣.","recall_at_2,","reciproc","recommend","recommendation,","recommendation.","rel(expected)","relev","reln={1(in∈iu+)0(otherwise).","reln\\mathrm{rel}_nrel​n​​","reln\\mathrm{rel}_nrel​n​​,","rel​n​​={​1​0​​​(i​n​​∈i​u​+​​)​(otherwise)​​.","respect","respons","responses,","responses.","result","retriev","return","roc","same","sampl","samples.","score","score(predicted)","second","select","separ","set","setting,","show","simpl","simpli","singl","six","size","softwar","solv","specifi","sponsor","struct(relscore,","such","suggest","sum","system,","t1","t1.max_k)","t2","t2.truth,"
 
,"t2.userid)","tabl","table,","tables,","tackl","take","target","th","that,","three","thus,","to_ordered_map(score,","top","true","true)","true))","truth","two","u={1,2,3}\\mathcal{u}","under","undergo","unlik","us","user","userid","userid,","u∈uu","valu","way","well","within","words,","zero","|\\mathcal{i}^","|\\mathcal{i}|","∣iu+∣×∣iu−∣|\\mathcal{i}^+_u|","∣iu+∩ik(u)∣|\\mathcal{i}^+_u","∣i∣|\\mathcal{i}|∣i∣."],"eval/datagen.html":["(asf),","apach","data","effort","foundat","gener","hivemal","incub","incubator.","softwar","sponsor","undergo"],"eval/lr_datagen.html":["\"","(","(asf),","(at","(label,features)","(recommended)",")",");","*","0.0","0.044","0.046","0.13126314\",\"190:0.18610542\",\"131:1.7232913\",\"24:","0.19020283\",\"21:","0.54811275\"]","0.5568947\",\"10:0.621897\",\"6:","0.7220096","0.7274741","0.7346627","0.9842969\",\"177:0.062993184\",\"176:","0/1","1","1.0","10","100","100\")","100')","1000","10k","1;","2","2.7551131\",\"113:","2;","5;
 
","9999","[\"139:1.9607254\",\"110:2.958568\",\"186:3.2524762\",\"31:3.9243593\",\"167:0.72854257\",\"26:1.8355447\",\"117:2.7663715\",\"3:2.1551287\",\"179:3.1099443\",\"19:3.6411424\"]","[\"140:2.8347101\",\"165:3.0056276\",\"179:4.030076\",\"112:3.3919246\",\"99:3.98914\",\"16:3.5653272\",\"128:3.046535\",\"124:2.7708225\",\"78:2.4960368\",\"6:1.7866131\"]","[\"34:2.9269936\",\"35:0.37033868\",\"39:3.771989\",\"47:2.2087111\",\"28:2.9445739\",\"55:4.134555\",\"14:2.4297745\",\"164:3.0913055\",\"52:2.0519433\",\"128:2.9108515\"]","[\"73:3.4391513\",\"198:4.42387\",\"164:4.248151\",\"66:3.5224934\",\"84:1.9026604\",\"76:0.79803777\",\"18:2.2168183\",\"163:2.248695\",\"119:1.5906067\",\"72:2.0267224\"]","[\"84:","[\"84:3.4227803\",\"80:3.8875976\",\"58:3.2909582\",\"123:3.1056073\",\"194:3.3360343\",\"199:2.20207\",\"75:3.5469763\",\"74:3.3869767\",\"126:0.9969454\",\"93:2.5352612\"]","[\"98:4.2451696\",\"4:3.486905\",\"133:2.4589922\",\"26:2.7301126\",\"103:2.6827147\",\"2:3.619825
 
4\",\"34:3.7042716\",\"47:2.5515237\",\"68:2.4294896\",\"197:4.4958663\"]","[4.061373,3.9373128,3.5195694,3.3604698,3.7698417,4.2518,3.8796813,1.6020582,4.937072,1.5513933,3.0289552,2.6674519,3.432688,2.980945,1.8897587,2.9770515,3.3435504,1.7867403,3.4057906,1.2151588,5.0587463,2.1410913,2.8097973,2.4518871,3.175268,3.3347685,3.728993,3.1443396,3.5506077,3.6357877,4.248151,3.5224934,3.2423255,2.5188355,1.8626233,2.8432152,2.2762651,4.57472,2.2168183,2.248695,3.3636255,2.8359523,2.0327945,1.5917025,2.9269936,0.37033868,2.6151125,4.545956,2.0863252,3.7857852,2.9445739,4.134555,3.0660007,3.4279037,2.0519433,2.9108515,3.5171766,3.4708095,3.161707,2.39229,2.4589922,2.7301126,3.5303073,2.7398396,3.7042716,2.5515237,3.0943663,0.41565156,4.672767,3.1461313,3.0443575,3.4023938,2.2205734,1.8950733,2.1664586,4.8654623,2.787029,4.0460386,2.4455893,3.464298,1.062505,3.0513604,4.382525,2.771433,3.2828436,3.803544,2.178681,4.2466116,3.5440445,3.1546876,3.4248536,0.9067459,3.0134914,1.9528451,1.71
 
75893,2.7029774,2.5759792,3.643847,3.0799,3.735559]","apach","array","cl\"","cl\")","classif","count(*)+1","count(1)","creat","data","dataset","dataset.","default","default,","dens","desc","detail","distribut","dual","dual;","dummi","effort","featur","fetched:","find","float","follows:","foundat","gener","generate_series(1,${n_parallel_datagen})","generated.","help').","hive>","hivemal","hivevar:n_parallel_datagen=10;","incub","incubator.","insert","int","label","label.","limit","logist","lr_datagen(\"","lr_datagen('","lrdata1k","lrdata1k;","mapred.reduce.tasks=","mapred.reduce.tasks=${n_parallel_datagen};","max)","multipl","n_dim","n_exampl","n_featur","none","ok","option","option,","parallel","reduc","reducers.","regress","regression_data1","regression_data1;","regression_data_dens","regression_data_dense;","replac","reset","row(s)","run","scalabl","seconds,","seed","select","seq10","seq10;","set","singl","softwar","spars","sponsor","t","tabl","taken:","task","time","undergo","us"
 
,"value;","view","well"],"misc/prediction.html":["\"model\"","\"predict","(0/1","(\\mathbf{x}_2,","(\\mathbf{x}_n,","(asf),","(i.e.,","(input)","(integer)","(output)","(sgd)","(synonym:","(x1,y1),(x2,y2),⋯,(xn,yn)(\\mathbf{x}_1,","(xi,yi)(\\mathbf{x}_i,","(λ\\lambdaλ","+","...","0","0,","0.54,","1","1,","1/1),","17.1","2","2.","21.3","42.195,","6.2",":=","[\"1:0.001\",\"4:0.23\",\"35:0.0035\",...]","[\"1:0.2\",\"3:0.1\",\"13:0.005\",...]","[\"5:1.3\",\"22:0.0.089\",\"77:0.0001\",...]","\\cdots,","\\frac{1}{n}","\\lambda","\\mathbf{x}_i,","\\sum_{i=1}^{n}","abov","accuracy.","achiev","adadelta","adagrad","adam","additionally,","algorithm","anoth","apach","applied.","appropri","articl","as:","assum","auxiliari","base","before,","behav","below","below:","binari","briefli","build","call","case","categor","choic","class","classif","classification,","classification.","classifier,","classifiers.","click","combin","condit","configur","construct","constructed.","context","contrast","cont
 
rol","ctr","current","demonstr","depend","descent","describ","design","detect","differ","differently;","document","e(\\mathbf{w})","e(w):=1n∑i=1nl(w;xi,yi)+λr(w)","e(w):=​n​​1​​​i=1​∑​n​​l(w;x​i​​,y​i​​)+λr(w)","e(w)e(\\mathbf{w})e(w)","e.g.,","effect","effort","elasticnet","enabl","epsilon_intensitive)","epsiloninsensitiveloss","error:","estim","even","eventually,","example,","example.","explain","extern","fail","featur","find","first","fitting.","flexibl","float","float/int","follow","follows:","for:","foremost,","formul","formulation,","foundat","function","function,","function.","function.)","function:","functions.","futur","gener","given","goal","gradient","guid","helpful.","here,","higher","hinge)","hingeloss","hivemal","hivemall'","hivemall,","hivemall:","huber)","huberloss","huberloss.","implement","importantly,","in:","incub","incubator.","input","input:","inputs.","insensit","interestingly,","iri","itself","kind","know:","l(\\mathbf{w}
 
;","l(w;xi,yi)l(\\mathbf{w};","l1","l2","label","labels:","learn","learning,","learnt.","list","log,","logistic)","logloss","loss","loss,","loss_funct","machin","mainli","make","mathemat","mean","minim","mllib","model","models,","modified_huber)","modifiedhuberloss","more","multi","need","neg","negative/posit","new","news20","normal","noteopt","number","numer","obtain","on","onc","opt,","optim","option","order","output","output:","over","pair","paramet","parameters)","point","possibl","practice,","predict","prediction.","prevent","problem","problem\"?","problem.","problems,","produc","provid","quantile)","quantileloss","r(\\mathbf{w})","r(w)r(\\mathbf{w})r(w)","range,","rate","rda","rda,","real","realiz","reason","reg,","regress","regression,","regression.","regular","repres","resources:","sampl","samples,","scikit","seen","set","sever","sgd","shown","singl","small","small/larg","softwar","solut","solv","sometim","spam","spark","sponsor","squared)","squared_epsilon_intensitive)","sq
 
uared_hinge)","squaredepsiloninsensitiveloss","squaredhingeloss","squaredloss","stochast","successfulli","target","task","techniqu","technique,","through","train","train_classifi","train_classifier()","train_classifier,","train_regress","train_regression()","tri","tutori","two","type","undergo","unforeseen","us","user","valu","value,","values,","values.","variant","vector","w\\mathbf{w}w","w\\mathbf{w}w.","way","weight","well:","work","x\\mathbf{x}x","y_1),","y_2),","y_i)","y_i)(x​i​​,y​i​​)","y_i)l(w;x​i​​,y​i​​)","y_n)(x​1​​,y​1​​),(x​2​​,y​2​​),⋯,(x​n​​,y​n​​),","yyi"],"binaryclass/general.html":["${n_samples}","${total_steps}","${total_steps}')","&","'","(","(asf),","(case","(feature,","(logress).","(t.featur","(t.rowid",")","),","*","/","0.0","0.5","1.0","10')","=",">=","a9a","a9a_test","a9a_test;","a9a_train","a9a_train;","abov","accuraci","actual","actual,","adadelta","adagrad","adagradrda","addition,","aggress","a
 
pach","arow","avg(weight)","base","batch","befor","binari","briefli","build","chapters,","choic","classif","classifi","classification:","classification_model","compar","comparison","comput","configur","configuration.","count(1)","creat","cw","data.","differ","does.","each","effort","end)a","eta","evalu","explode(add_bias(features))","extract_feature(feature)","extract_weight(feature)","featur","feature,","feature;","first","follow","formul","foundat","function","function.","function:","functions:","further","gener","group","guide,","hence,","here,","hive>","hivemal","hivevar:n_samples=16281;","hivevar:total_steps=32561;","however,","ideal","implement","incub","incubator.","indic","instructions.","interfac","interface,","introduc","it.","join","label","label,","later","later.","left","likewise,","logist","logloss","logress","logress()","logress(add_bias(features),","loss","m","m.feature)","mani","manner","map","mathemat","mini","mini_batch","model","n_sampl","need","next","note","not
 
ethi","opt","option","options.","other.","outer","page","paramet","part","particular,","passiv","pd","pd.label","pd.prob","pd.rowid)","perceptron","predict","predicted,","predicted;","prediction:","prepar","prob,","probabl","provid","queri","queries,","rc.1","reg","regress","regression.","regressor","results:","rowid,","same","sampl","scw","see","select","set","settings.","sgd","show","sigmoid(sum(m.weight","similar","simpl","simpler","softwar","sponsor","submit","support","t","t.label","t.rowid","t.rowid,","t.value))","tabl","tasks}:","test_explod","thus,","time,","total_step","train","train_classifi","train_classifier().","train_classifier(add_bias(features),","train_classifier.","tri","tutori","two","under","undergo","us","usag","user","util","v0.5","valu","variant","varieti","view","vs.","weight","weight)","without","work","{#"],"binaryclass/a9a.html":["(asf),","a9a","apach","effort","foundat","hivemal","incub","incubator.","softwar","sponsor","tutori","undergo"],"binaryclass/a9
 
a_dataset.html":["\",\"","\"s/","\"s/+1/1/\"","'/dataset/a9a/test';","'/dataset/a9a/train';","'\\t'","(","(asf),",")","/dataset/a9a/test","/dataset/a9a/train","/mnt/archive/datasets/classification/a9a","1/0/\"",">","a9a","a9a.t","a9a.test","a9a.train","a9a;","a9atest","a9atrain","apach","array","awk","cd","collect","conv.awk","copyfromloc","creat","data","databas","delimit","e","effort","extern","f","featur","field","float,","format","foundat","fs","hadoop","hdf","hivemal","http://www.csie.ntu.edu.tw/~cjlin/libsvmtools/datasets/binary.html#a9a","incub","incubator.","int,","item","label","locat","mkdir","p","prepar","put","row","rowid","sed","softwar","sponsor","store","tabl","termin","textfil","training/test","undergo","us",";|"],"binaryclass/a9a_lr.html":["\"","\"count(1)","#map","${num_test_instances}","${total_steps}\")","(","(asf),","(e.g.,","(feature,weight)","(learn","(select","(t.featur","(t.rowid",")","*","/","0.0","0.5","0.8430071862907684","1.0","=","==",">=","a9a_model1","
 
a9a_predict1","a9a_submit1","a9atest","a9atest;","a9atest_explod","a9atrain","a9atrain;","actual","actual,","apach","autonom","avg(weight)","cast((cas","cast(featur","count(1)","creat","effort","end)","estimator.","eta","eta0)","evalu","explode(addbias(features))","extract_feature(feature)","extract_weight(feature)","familiar","featur","feature,","feature;","float)","foundat","function.i","group","hivemal","hivevar:num_test_instances=16281;","hivevar:total_steps=32561;","ideal","incub","incubator.","int)","join","label","label,","later","left","logist","logress()","logress(addbias(features),label,\"","m","m.feature)","option","options.","outer","pd","pd.label","pd.prob","pd.rowid);","predict","predicted,","predicted;","prepar","prob,","probabl","rate)","recommend","regress","replac","rowid,","select","set","sigmoid(sum(m.weight","softwar","sponsor","t","t.label","t.rowid,","t.rowid;","t.value))","tabl","tasks\"","those","total_step","total_steps\"","train","udf","undergo","us","valu
 
","view","weight"],"binaryclass/a9a_minibatch.html":["${mini_batch_size}\")","${num_test_instances}","${total_steps}","(asf),","(feature,weight)","(select",")","/","0.8430071862907684","0.8463239358761747","==","a9a_model1","a9a_submit1","a9atrain","actual","apach","appli","avg(weight)","batch","cast(featur","content","count(1)","creat","depend","descent","effort","evalu","example.","explain","feature,","feature;","first.","foundat","gradient","group","hivemal","hivevar:mini_batch_size=10;","hivevar:total_steps=32561;","incub","incubator.","int)","it.","logist","logress(addbias(features),label,\"","mini","mini_batch","minibatch","page","predicted;","refer","regress","replac","select","set","so,","softwar","sponsor","stochast","t","tabl","total_step","train","undergo","weight"],"binaryclass/news20.html":["(asf),","apach","effort","foundat","hivemal","incub","incubator.","news20","softwar","sponsor","tutori","undergo"],"binaryclass/news20_dataset.html":["\"","\",\"","#","$","'/dataset
 
/news20","'\\t'","(","(asf),","(rowid,",")","*","*)","/dataset/news20","/home/myui/tmp/defin","/home/myui/tmp/hivemall.jar;","15000","4996",">","[mac]","add","all.hive;","amplify(3,","apach","array","begin{","binary/test","binary/test';","binary/train","binary/train';","brew","cast(split(feature,\":\")[0]","cast(split(feature,\":\")[1]","cat","cluster","collect","conv.awk","copyfromloc","coreutil","creat","data","databas","dataset.","delet","delimit","effort","explode(addbias(features))","extern","extract_feature(feature)","extract_weight(feature)","f","featur","feature,","feature;","features)","features=\\$2;","field","float)","for(i=3;i","format","foundat","fs","fs=\"","gawk","gsort","hadoop","hdf","head","hivemal","hivevar:seed=31;","http://www.csie.ntu.edu.tw/~cjlin/libsvmtools/datasets/binary.html#news20.binari","incub","incubator.","instal","int)","int,","item","jar","label","label,","label=\\$1;","later","locat","mkdir","news20.binari","news20.random","news20.test","news20.te
 
st.t","news20.train","news20.train.t","news20;","news20b","news20b_test","news20b_test_explod","news20b_train","news20b_train_x3","p","prepar","put","r","rand(${seed});","replac","row","rowid","rowid,","select","set","softwar","sourc","sponsor","store","t","tabl","tail","termin","textfil","training/test","undergo","us","v0.3.1","valu","view","{","}"],"binaryclass/news20_pa.html":["(asf),","(feature,weight)","(pa1)]","(pa2)]","(select","(t.featur","(t.rowid",")","*","/home/myui/tmp/defin","/home/myui/tmp/hivemall.jar;","0.0","0.9459567654123299","0.9597678142514011","0.9601681345076061","0.9603682946357086","1","=","==",">","[passiv","[perceptron]","actual","actual,","add","aggress","aggressive]","all.hive;","apach","build","case","clean","count(1)/4996","creat","delet","drop","effort","end","evalu","feature,","feature;","foundat","group","hivemal","incub","incubator.","jar","join","label","left","m","m.feature)","model","news20b_pa1_model1","news20b_pa1_model1;","news20b_pa1_predict
 
1","news20b_pa1_predict1;","news20b_pa1_submit1","news20b_pa1_submit1;","news20b_pa2_model1","news20b_pa2_model1;","news20b_pa2_predict1","news20b_pa2_predict1;","news20b_pa2_submit1","news20b_pa2_submit1;","news20b_pa_model1","news20b_pa_model1;","news20b_pa_predict1","news20b_pa_predict1;","news20b_pa_submit1","news20b_pa_submit1;","news20b_perceptron_model1","news20b_perceptron_model1;","news20b_perceptron_predict1","news20b_perceptron_predict1;","news20b_perceptron_submit1","news20b_perceptron_submit1;","news20b_test","news20b_test_explod","news20b_train_x3","outer","passiv","pd","pd.label","pd.rowid);","perceptron(addbias(features),label)","perceptron,","predict","predicted;","prepar","replac","select","softwar","sourc","sponsor","sum(m.weight","t","t.label","t.rowid,","t.rowid;","t.value)","tabl","total_weight,","train_pa(addbias(features),label)","train_pa1(addbias(features),label)","train_pa2(addbias(features),label)","udf","undergo","view","voted_avg(weight)","weight"],"bin
 
aryclass/news20_scw.html":["(arow)","(asf),","(cw)","(feature,","(feature,weight)","(feature,weight,covar)","(scw1)","(scw2)","(select","(t.featur","(t.rowid",")","*","/home/myui/tmp/defin","/home/myui/tmp/hivemall.jar;","0.0","0.9459567654123299","0.9579663730984788","0.9597678142514011","0.9601681345076061","0.9603682946357086","0.9655724579663731","0.9659727782225781","0.9661729383506805","1","=",">","[hivemal","accuraci","actual","actual,","adapt","add","algorithm","all.hive;","apach","argmin_kld(weight,","arow","arow,","case","classification.","clean","confid","confidec","count(1)/4996","covar)","creat","cw","cw,","delet","drop","effort","end","evalu","feature,","feature;","foundat","group","hivemal","incub","incubator.","jar","join","label","label)","later]","left","m","m.feature)","news20;","news20b_arow_model1","news20b_arow_model1;","news20b_arow_predict1","news20b_arow_predict1;","news20b_arow_submit1","news20b_arow_submit1;","news20b_cw_model1","news20b_cw_model1;","news2
 
0b_cw_predict1","news20b_cw_predict1;","news20b_cw_submit1","news20b_cw_submit1;","news20b_scw2_model1","news20b_scw2_model1;","news20b_scw2_predict1","news20b_scw2_predict1;","news20b_scw2_submit1","news20b_scw2_submit1;","news20b_scw_model1","news20b_scw_model1;","news20b_scw_predict1","news20b_scw_predict1;","news20b_scw_submit1","news20b_scw_submit1;","news20b_test","news20b_test_explod","news20b_train_x3","outer","pa","pa1","pa2","pd","pd.label","pd.rowid);","perceptron","predict","predicted;","prepar","recommend","regular","replac","scw","scw1","scw2","select","soft","softwar","sourc","sponsor","sum(m.weight","t","t.label","t.rowid,","t.rowid;","t.value)","tabl","total_weight,","train","train_arow(addbias(features),label)","train_cw(addbias(features),","train_scw(addbias(features),label)","train_scw2(addbias(features),label)","udf","undergo","us","v0.1]","v0.2","vector","view","voted_avg(weight)","weight","weight)","weight,"],"binaryclass/news20_adagrad.html":["(adadelta)","(a
 
dagrad)","(asf),","(feature,weight)","(select","(t.featur","(t.rowid",")","*","./tmp/defin","./tmp/hivemal","0.0","0.5","0.9545636509207366","0.9549639711769415","0.9661729383506805","0.9677742193755005","0/1","0/1.","1","1/+1","=","==",">",">=","[adadelta]","[adagrad]","[adagradrda]","actual","actual,","adadelta","adadelta(addbias(features),convert_label(label))","adagrad","adagrad(addbias(features),convert_label(label))","adagrad+rda","adagrad,","adagrad.","adagradrda","adagradrda,","add","all.hive;","apach","appli","beta2","better","build","case","classification,","convert","convert_label(label)","count(1)/4996","creat","current","dependencies.jar;","drop","effort","end","evalu","featur","feature,","feature;","foundat","function.","group","hing","hivemal","implement","implmenet","incub","incubator.","jar","join","label","later.","left","logist","loss","loss.","m","m.feature)","model","news20;","news20b_adadelta_model1","news20b_adadelta_model1;","news20b_adadelta_predict1","news2
 
0b_adadelta_submit1","news20b_adagrad_model1","news20b_adagrad_model1;","news20b_adagrad_predict1","news20b_adagrad_rda_model1","news20b_adagrad_rda_model1;","news20b_adagrad_rda_predict1","news20b_adagrad_rda_submit1","news20b_adagrad_submit1","news20b_test","news20b_test_explod","news20b_train_x3","note","outer","p","p.label","p.rowid);","pd","pd.label","pd.rowid);","perform","predict","predicted;","prepar","problem","regress","regression,","replac","scw1","select","sigmoid(sum(m.weight","softwar","sourc","sponsor","suit","sum(m.weight","support","t","t.label","t.rowid,","t.rowid;","t.value)","t.value))","tabl","take","total_weight,","train_adagrad_rda(addbias(features),label)","udf","undergo","us","v0.3","valu","view","voted_avg(weight)","weight"],"binaryclass/news20_rf.html":["${classification})","'","(","(asf),","(i.e.,","(t.rowid",")","/","0.8112489991993594","0/1","1/1","4996.0","50","71'",";","=","[0,","accuraci","actual","actual,","apach","avoid","cautionlabel","classes.","
 
convert","convert_label(label),","convert_label(t.label)","count(1)","creat","cross","drop","effort","evalu","featur","feature,","feature_hash","features,","forest","forest,","forest.","foundat","function","group","hivemal","hivevar:classification=true;","hyperparamet","i.e.,","incub","incubator.","input","inputs.","join","k","k)","later._","left","libsvm","m","m.model,","m.model_weight,","model_weight)","notethi","number","oob","outer","p","p.predicted.label","p.rowid)","predict","predicted.posteriori)","predicted.posteriori,","predicted;","prepar","random","rc.1","rf_ensemble(predicted.value,","rf_model","rf_model;","rf_predict","rf_predicted;","rowid","rowid,","seed","select","set","softwar","spars","sponsor","submit","support","t","t.features,","t1","tabl","test","train","train;","train_randomforest_classifier(","tree","tree_predict(m.model_id,","undergo","us","v0.5","vector"],"binaryclass/kdd2010a.html":["(asf),","apach","effort","foundat","hivemal","incub","incubator.","kdd201
 
0a","softwar","sponsor","tutori","undergo"],"binaryclass/kdd2010a_dataset.html":["\",\"","${shufflebuffersize},","'/dataset/kdd10a/test';","'/dataset/kdd10a/train';","'\\t'","(","(\"orc.compress\"=\"snappy\");","(algebra))","(asf),","(rowid,","(testing)","(training)",")","*","*)","./tmp/defin","./tmp/hivemall.jar;","/","/dataset/kdd10a/test/kdda.t","/dataset/kdd10a/train/kdda","1;","2","2.73","20,216,830","510,302","8,407,752","add","all.hive;","apach","array","auxiliari","awk","bigint,","cast(split(feature,\":\")[1]","classes:","cluster","collect","conv.awk","creat","data","data:","databas","defin","delimit","effort","explode(addbias(features))","extern","f","featur","feature,","feature;","features)","features:","field","float)","format","foundat","fs","gb","hadoop","hdf","hivemal","hivemall.amplify.seed=32;","hivevar:shufflebuffersize=1000;","hivevar:xtimes=3;","http://www.csie.ntu.edu.tw/~cjlin/libsvmtools/datasets/binary.html#kdd2010","incub","incubator.","insert","int,","item";,
 
"jar","kdd10a_test","kdd10a_test_explod","kdd10a_train","kdd10a_train_orcfil","kdd10a_train_orcfile;","kdd10a_train_x3","kdd2010;","kdda","kdda.t","label","label,","later","locat","make","mapred.reduce.tasks=","mapred.reduce.tasks=64;","number","orc","overwrit","prepar","put","rand();","rand_amplify(${xtimes},","replac","row","rowid","rowid,","select","set","softwar","sourc","split(feature,\":\")[0]","sponsor","store","t","tabl","tblproperti","termin","textfil","training/test","undergo","us","valu","view","|"],"binaryclass/kdd2010a_scw.html":["(asf),","(feature,weight)","(feature,weight,covar)","(select","(t.featur","(t.rowid",")","*","0.0","0.8676038894615345","0.8677782959894337","0.8678037711002504","0.8678096499719774","1","=",">","[hivemal","accuraci","actual","actual,","algorithm","apach","argmin_kld(weight,","arow","arow,","case","count(1)/510302","covar)","creat","cw","cw,","drop","effort","end","evalu","feature,","feature;","foundat","group","hivemal","incub","incubator.","
 
join","kdd10a_arow_model1","kdd10a_arow_model1;","kdd10a_arow_predict1","kdd10a_arow_submit1","kdd10a_cw_model1","kdd10a_cw_model1;","kdd10a_cw_predict1","kdd10a_cw_submit1","kdd10a_pa1_model1","kdd10a_pa1_model1;","kdd10a_pa1_predict1","kdd10a_pa1_submit1","kdd10a_scw_model1","kdd10a_scw_model1;","kdd10a_scw_predict1","kdd10a_scw_submit1","kdd10a_test","kdd10a_test_explod","kdd10a_train_x3","label","later]","left","m","m.feature)","mapred.reduce.tasks=32;","outer","pa,","pa1","pd","pd.label","pd.rowid);","predict","predicted;","replac","scw","scw1","select","set","softwar","sponsor","sum(m.weight","t","t.label","t.rowid,","t.rowid;","t.value)","tabl","total_weight,","train","train_arow(addbias(features),label)","train_cw(addbias(features),label)","train_pa1(addbias(features),label)","train_scw(addbias(features),label)","undergo","v0.1]","v0.2","v0.2alpha3","view","voted_avg(weight)","weight"],"binaryclass/kdd2010b.html":["(asf),","apach","effort","foundat","hivemal","incub","incuba
 
tor.","kdd2010b","softwar","sponsor","tutori","undergo"],"binaryclass/kdd2010b_dataset.html":["\",\"","${shufflebuffersize},","'/dataset/kdd10b/test';","'/dataset/kdd10b/train';","'\\t'","(","(asf),","(bridg","(rowid,","(testing)","(training)",")","*)","./tmp/defin","./tmp/hivemall.jar;","/","/dataset/kdd10b/test/kddb.t","/dataset/kdd10b/train/kddb","19,264,097","2","29,890,095","748,401","add","algebra))","all.hive;","apach","array","auxiliari","awk","cast(split(feature,\":\")[1]","classes:","collect","conv.awk","creat","data","databas","defin","delimit","effort","examples:","explode(addbias(features))","extern","f","featur","feature,","feature;","features)","features:","field","float)","format","foundat","fs","hadoop","hdf","hivemal","hivevar:shufflebuffersize=1000;","hivevar:xtimes=3;","http://www.csie.ntu.edu.tw/~cjlin/libsvmtools/datasets/binary.html#kdd2010","incub","incubator.","int,","item","jar","kdd10b_test","kdd10b_test_explod","kdd10b_train","kdd10b_train;","kdd10b_train
 
_x3","kdd2010;","kddb","kddb.t","label","label,","later","locat","make","number","prepar","put","rand_amplify(${xtimes},","replac","row","rowid","rowid,","select","set","softwar","sourc","split(feature,\":\")[0]","sponsor","store","t","tabl","termin","textfil","training/test","undergo","us","valu","view","|"],"binaryclass/kdd2010b_arow.html":["(asf),","(feature,weight)","(feature,weight,covar)","(select","(t.featur","(t.rowid",")","*","0.0","0.8565808971393678","1","=",">","[hivemal","actual","actual,","apach","argmin_kld(weight,","arow","case","count(1)/748401","covar)","creat","drop","effort","end","evalu","feature,","feature;","foundat","group","hivemal","incub","incubator.","join","kdd10b_arow_model1","kdd10b_arow_model1;","kdd10b_arow_predict1","kdd10b_arow_submit1","kdd10b_test","kdd10b_test_explod","kdd10b_train_x3","label","later]","left","m","m.feature)","mapred.reduce.tasks=32;","outer","pd","pd.label","pd.rowid);","predict","predicted;","replac","select","set","softwar","
 
sponsor","sum(m.weight","t","t.label","t.rowid,","t.rowid;","t.value)","tabl","total_weight,","train","train_arow(addbias(features),label)","undergo","v0.1]","v0.2","v0.2alpha3","view","voted_avg(weight)","weight"],"binaryclass/webspam.html":["(asf),","apach","effort","foundat","hivemal","incub","incubator.","softwar","sponsor","tutori","undergo","webspam"],"binaryclass/webspam_dataset.html":["\",\"","${shufflebuffersize},","'/dataset/webspam/raw';","'\\t'","(","(\"orc.compress\"=\"snappy\");","(asf),","(rowid,","(select","(xtime",")","*","*)","./tmp/defin","./tmp/hivemall.jar;","/dataset/webspam/raw","/dataset/webspam/raw/","1;","70000;","=","\\","add","addbias(features)","all.hive;","apach","array","auxiliari","awk","cach","cast(split(feature,\":\")[1]","caution:","cluster","collect","conv.awk","creat","data","databas","dataset","dataset,","delet","delimit","each","effort","exampl","exist","explode(addbias(features))","extern","f","featur","feature,","feature;","features)","field"
 
,"float)","format","foundat","fs","hadoop","hdf","hive.sample.seednumber=43;","hivemal","hivemall.amplify.seed=32;","hivevar:shufflebuffersize=100;","hivevar:xtimes=3;","http://www.csie.ntu.edu.tw/~cjlin/libsvmtools/datasets/binary.html#webspam","incub","incubator.","insert","int,","item","jar","label","label,","later","limit","locat","lot","make","mapred.reduce.tasks=","mapred.reduce.tasks=128;","memory.","mkdir","n)","orc","overwrit","p","parepar","prepar","put","rand(43)","rand(43);","rand_amplify(${xtimes},","replac","row","rowid","rowid,","rows)","s","s.rowid","s.rowid,","select","set","shufflebuffers","small","softwar","sourc","split(feature,\":\")[0]","sponsor","store","t","t.rowid)","tabl","tablesample(1000","tblproperti","termin","textfil","though","train","undergo","us","valu","view","webspam;","webspam_raw","webspam_test","webspam_test_explod","webspam_train_orcfil","webspam_train_orcfile;","webspam_train_x3","webspam_wc_normalized_trigram.svm","|"],"binaryclass/webspam_s
 
cw.html":["(asf),","(feature,weight)","(feature,weight,covar)","(select","(t.featur","(t.rowid",")","*","./tmp/defin","./tmp/hivemall.jar;","0.0","0.9628428571428571","0.9747428571428571","0.9778714285714286","1","33554432\")","=",">","accuracy:","actual","actual,","add","all.hive;","apach","argmin_kld(weight,covar)a","arow","arow,","case","cast(voted_avg(weight)","count(1)/70000","creat","delet","dens","dim","drop","effort","end","feature,","feature;","float)","foundat","group","hivemal","incub","incubator.","jar","join","label","left","m","m.feature)","model","outer","pa1","pa1,","pd","pd.label","pd.rowid);","predict","predicted;","prepar","replac","scw","scw1","select","softwar","sourc","spars","sponsor","

<TRUNCATED>

Reply via email to