http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/blob/1c94a881/userguide/search_index.json
----------------------------------------------------------------------
diff --git a/userguide/search_index.json b/userguide/search_index.json
index 8e69da9..78d2108 100644
--- a/userguide/search_index.json
+++ b/userguide/search_index.json
@@ -1 +1 @@
-{"index":{"version":"0.5.12","fields":[{"name":"title","boost":10},{"name":"keywords","boost":15},{"name":"body","boost":1}],"ref":"url","documentStore":{"store":{"./":["(asf),","adadelta.","adapt","algorithm","analyt","anomali","apach","architectur","art","batch","build","built","classification,","collect","confid","consid","conversely,","cross","data","design","detection,","eas","effort","engineering.","factor","featur","foundat","function","functionalities:","functions.","hive","hive/pig.","hivemal","incub","incubator.","interface.","introduct","k","learn","learning;","librari","machin","machines,","mainli","model","nearest","neighbor,","number","offer","pig","platform","predict","provid","queri","recommendation,","regression,","regular","run","runtime.","soft","softwar","spark","spark/pig,","sponsor","state","such","support","through","thus,","udf/udaf/udtf","undergo","us","varieti","vectors,","versatil","weight","weighted,"],"getting_started/":["(asf),","apach","effort","founda
 
t","get","hivemal","incub","incubator.","softwar","sponsor","start","summari","undergo"],"getting_started/installation.html":["$","$home/.hiverc","(asf),","(of","./target.","/home/myui/tmp/defin","/home/myui/tmp/hivemal","/tmp/defin","/tmp/hivemal","7","add","all.hiv","all.hive;","alternatively,","apach","automat","bin/build.sh","build","cd","choic","clone","command","defin","docker","e.g.,","each","effort","file.","find","follow","foundat","function","git","given","hadoop","hive","hivemal","hivemall.git","https://github.com/apache/incub","incub","incubator.","instal","jar","java","later","line","load","note","pig","platforms:","prerequisit","run","session.","softwar","sourc","spark","sponsor","start","test","then,","time","time.","two","undergo","v0.13","v0.5.0)","v2.4.0","version,","xxx.jar","xxx.jar;"],"getting_started/permanent-functions.html":["\"hivemall.\"","\"hivemall.*\";","(asf),","/apps/hivemal","/tmp/defin",">","apach","auxiliari","avoid","call","case","cautiony","confir
 
m","creat","databas","database.","databases,","ddl","default","defin","each","effort","exist","first,","follow","follows:","foundat","fs","function","hadoop","hdf","hive","hivemal","hivemall.","hivemall.adadelta","hivemall.adagrad","hivemall;","hiveserv","hivevar:hivemall_jar=hdfs:///apps/hivemall/hivemal","incub","incubator.","instal","jar","later","live","load","mkdir","need","non","p","perman","permanent.hive,","permanent.hive;","prefix","put","queri","scheme,","script","session.","sessions.","set","show","softwar","sourc","specifi","sponsor","step","support","then,","through","udf","udfs.","undergo","us","v0.13","xxx.jar","xxx.jar.jar;"],"getting_started/input-format.html":["\"0\"","\"0:1.0\"","\":\",","\"dog\"","\"height:1.5\"","\"length:2.0\"","\"length:2.0\")","\"name\"),","\"weight\"),","\"xxxxxxx","(","(+1)","(=16777216)","(a.k.a.","(asf),","(binari","(call","(cf.","(e.g.,","(for","(i.e.,","(int","(or","(v0.3.1","(we","(weight)",")","),",");",",\"","..","0","0,","0.0","0.0f
 
","1","1)","1),","1,","1,180.3,70.2","1,cast(nul","1.","1.0","1.0,","1.0.","1.0f","10:3.4","123:0.5","16777216.","2","2^24","3)","34567:0.231","43352:55.3","55.0","55.0);",":","::=","[\"1:3.0\",\"2:4.0\",\"3:5.0\"]","[\"apple:1.0\",\"height:180.3\",\"weight:70.2\"]","[\"apple:1.0\",null,\"weight:70.2\"]","[\"is_cat#1\",\"is_dog#0\",\"is_lion#1.0\",\"is_pengin#true\",\"species#dog\"]","[\"is_cat#1\",\"is_dog#0\",\"is_lion#1.0\",\"is_pengin#true\",null]","[,","[10,7,9]","accept","actual","ad","add_bia","add_feature_index","add_feature_index(array(3,4.0,5))","addit","alternatively,","apach","append","appli","argument","arguments:","array","array<int|bigint|text>","array(\"apple\",\"height\",\"weight\"),","array(\"bias:1.0\"),","array(\"height\",","array(\"height:1.5\",","array(\"id\",","array(\"is_cat\",\"is_dog\",\"is_lion\",\"is_pengin\",\"species\"),","articl","befor","between","bia","bias/dummi","bigint)","bigint,","binari","call","cast","cast(target","categor","categorical_feat
 
ures(","categorical_features(array","class","class)","classif","classifi","click_or_not","column","column.","common","compat","compress","concat(\"weight\",\":\",55.0);","concat(mhash(extract_feature(\"xxxxxxx","concat_array(","consid","const","convert_label(","convert_label(0.0f),","convert_label(1),","convert_label(1.0f)","creat","data","default","denot","describ","detail.","dimens","don't","doubl","double),70.2","dual;","dummi","e.g.","each","ebnf","effort","element","emit_null\"","entry.","exampl","example,","example.","example:","examples.","except","explain","explanatori","explicitli","extract_feature(\"weight:55.0\"),","extract_weight(\"weight:55.0\");","extract_weight(\"xxxxxxx","featur","feature(\"weight\",","feature(mhash(extract_feature(\"xxxxxxx","feature1,","feature2,","feature_index(array(\"10:0.2\",\"7:0.3\",\"9\"));","featurenames,","features)","features,","features.","first","fit","float","float)","follow","follows:","format","format.","format:","foundat","function"
 
,"function)","function.","gener","general,","hand,","happens.","hash","hashing/hash","height,","helper","here","here,","hivemal","hivemall.","huge","hyperparameters).","id,","import","incub","incubator.","index","index)","index.","input","instanc","int","int,","label","label,","label.","large.","later","later)","later,","learning.","less","libsvm","logist","long","machin","memori","mention","mhash","model","multi","name","need","neg","normal","notat","note","note:","null","number","number.","numbers,","omit","option","options])","outofmemori","page","pleas","posit","predict","prepar","primit","probabl","produc","provid","quantit","quantitative_features(","quantitative_features(array","rang","real","refer","regress","regression)","regression,","regression.","repres","reserv","respectively.","respons","response/predictor","row","rowid()","rowid,","scheme","select","setting.","similar","softwar","spaces,","spars","specif","specifi","sponsor","start","statistics).","statistics,","storag
 
e)","string","support","tabl","table.","table;","take","target","target)","target.","text","text.","through","train","trick","true,","two","type","typically,","undergo","us","usual","v0.3","v0.3,","v0.3.2","v0.4.0","valu","variabl","variable,","variable.","variables.","vector","veri","vowpal","wabbit.","weight","weight.","weight:55.0","weight:55.3\")","weight:55.3\"))","weight:55.3\")),","yyyyyi","|"],"misc/funcs.html":["(","(...,","(1.0","(:)*","(arow)","(asf),","(coeffici","(cw)","(f1score","(i.e.,","(pa","(pa)","(scw","(select","(sst).","(string","(sum(1.0","(sum(mean","(zscore)",")","),","*","*)","+",",","..","...","...)","..]","/","0","1","1)","1.0","10')","1296","1;","1k","1st","2","2)","2770","2:v2,","2^2n","2^zoom","3","4","4.0","5","5008","5824","5925","::","=",">",">=","@nonnul","@nullabl","[,","[,int","[1:v1,","[const","[or","[string","])","absolut","actual)","actual,","adapt","add_bias(feature_vector","add_feature_index(array[double]:","add_field_indices(array","aggreg",
 
"aggress","algorithm","amplif","amplifi","amplify(const","angular","angular_distance(ftvec1,","angular_similarity(ftvec1,","anomali","apach","approx_count_distinct(expr","approxim","argmin_kld(float","argument","arow","array","array(l.id))","array)","array,","array:","array>","array[int])","array_hash_values(array","array|int|","attribut","auc","auc(array","augment","auto_shrink","averag","average_precision(array","avg(rating)","b","b])","bag","base","bbit_minhash(array<>","beta=1.0)","between","bf","bf2)","bi","bi[,","bi])","bia","bin","binari","binarize_label(int/long","bins:","bit","bloom","bloom(id)","bloom(movieid)","bloom(str","bloom)","bloom,","bloom1,","bloom2)","bloom_and(bf1,","bloom_and(str","bloom_contains(r.movies,","bloom_contains(str","bloom_contains_any(r.bf,","bloom_contains_any(str","bloom_not(bf)","bloom_not(str","bloom_or(bf1,","bloom_or(str","bloomfilt","boolean","bpr_sampling(int","bprmf_predict(list","bu,","build","build_bins(numb","categor","categorical_featu
 
res(array","chang","changefinder(double|array","changefinder.","chi2(array>","chi2_val","class","classif","classifi","classification=false])","classnames=null)","classweights])","clusterid)","cnt","coeffici","col1,","col2,","colnorm","column","compare,","comput","confid","consid","consist","const","constant","construct","contain","conv2dense(int","convers","correctitem","cosin","cosine_distance(ftvec1,","cosine_similarity(ftvec1,","count(distinct","covar","covar)","covar)))","creat","cross","d)","data","data1","data2","dataset","decis","degre","dens","depth","describ","detail","detect","determination)","differ","differences:","dimensions)","dimsum_mapper(array","distanc","distance),","distance2similarity(float","distribut","diverg","doubl","dual","dual;","each","effort","element","encod","ensembl","error","euclid","euclid_distance(ftvec1,","euclid_similarity(ftvec1,","evalu","exist","expected)","explode(array(1,2,3,4,5))","explode(array(1,3,5,6,8))","export","extract_feature(feature
 
_vector","extract_weight(feature_vector","f","f1","f1score(array[int],","factor","fals","false])","featur","feature(","feature,","feature1,","feature2,","feature_binning(array","feature_hashing(array","feature_index(feature_vector","feature_pairs(feature_vector","feature_vector)","feature_vector,","featurenames,","featurenames=null,","features)","features,","ffm_features(const","ffm_predict(float","field","filter","float","fm_predict(float","fmeasure(array|int|boolean","forest","format","formula","foundat","frequenc","ftvec2)","func(lat,lon,zoom)","func(numb","func(str","function","functions.","gener","geospati","given","googl","group","guess_attribute_types(*)","guess_attribute_types(any,","ham","hamming_distance(a,","hash","have","haversin","haversine_distance(doubl","hing","hitrat","hitrate(array","hivemal","hivemall_version()","hivemall_version();","hot","http://tile.openstreetmap.org/${zoom}/${xtile}/${ytile}.png","http://wiki.openstreetmap.org/wiki/slippy_map_tilenam","https:/
 
/www.google.com/maps/@${lat},${lon},${zoom}z","hyperloglogplu","i,","id","identifi","includ","incub","incubator.","index","index,","indexed_features(doubl","indic","input","int","int/long","intercept,","int|str","item","item,","item_pairs_sampling(array","items,","j,","jaccard","jaccard_distance(a,","jaccard_similarity(a,","javascript/dot]","join","k","k])","key","key(s).","key)","keygroup","keys)","kl","kld(doubl","km","kpa_predict(@nonnul","l","l.*","l.movieid)","l.rate","l.rating,","l.rating;","l.userid)","l1","l1_normalize(ftvec","l2","l2_normalize(ftvec","label","label)","label,","lambda[,","lat,","lat1,","lat2,","lat2tiley(doubl","latitud","latlon_distance(lat1,","lda_predict(str","learn","level","level.","libffm","limit","list","local","locat","logic","logist","logloss(doubl","logrithm","lon,","lon1,","lon2)","lon2,","lon2tilex(doubl","longitud","loss","lr_datagen('","lr_datagen(opt","m1,","machin","mae(doubl","manhattan_distance(list","map","map)","map>","map_url(doubl","map
 
s:","matrix","max","max)","max_item_id","max_label(doubl","maximum","maxrow(ani","mean","mean,","measur","mf_predict(list","mhash(str","mile=false])::doubl","miles]","min","min,","minhash","minhash(ani","minhashes(array<>","minim","minkowski_distance(list","model","model,","model_id,","model_weight=1.0]])","modelid,","more","movi","movieid","mrr","mrr(array","mse(doubl","mu2,","mu]])","mu]]>","multiclass","murmurhash3","n","n_exampl","n_featur","ndcg","ndcg(array","ndims)","negative,","negitem","nois","non","normal","noweight]])","null.","num_of_bins[,","number","numfeatures])","numfeatures],","numhashes,","numhashes])","observed,","on","onehot","onehot_encoding(primit","oob_error_rate>","oob_errors,","oob_tests>","openstreetmap:","option","option])","options,","options])","options],","other","outlier/chang","output,","p)","p_val","page","pare","partial","passiv","perceptron","plsa_predict(str","point","polynomi","polynomial_features(feature_vector","popcnt(a","popcount","populate_n
 
ot_in(list","pos_items,","posit","positem","positem,","positive,","positive/neg","posteriori>","power","powered_features(feature_vector","precis","precision_at(array","pred_model","pred_model>","pred_models,","predict","predicted)","predicted,","prefix","prefixed_hash_values(array","preprocess","prob[,","proba","probabilities>","probability)","pu,","purpos","q,q,c,c,c,c,q,c,c,c,q,c,q,q,q,q,c,q","qi","qi[,","quantified_features(boolean","quantify(boolean","quantil","quantiles)","quantiles_map)","quantitative_features(array","r","r2(doubl","r_i,","r_j","rand_amplify(const","random","randomforest","rank","rankitem","rankitems,","rankitems.s","rankitems.size])","rate","ratio","recal","recall_at(array","recommend","recommends","record","refer","regress","regressor","regular","relat","repres","rescal","rescale(value,","result","return","rf_ensemble(int","rmse(doubl","root","row","row,","rowid,","satisfied_movi","scale","score","score,","see","select","sensit","set","sha","sha1(str","shrin
 
kage,","side","sigma","sigma1,","signal","signatur","similar","similarity,","singular","sketch","snr(array","soft","softwar","sort","sort_by_feature(map","space","spars","special","specifi","spectrum","sponsor","sqrt(sum((x","squar","sst(double|array","standard","start","stddev)","string","string)","string[]","such","sum","sum(|x","t","t;","tabl","take","target","term","text)","tf(string","tile","tile(doubl","tilex2lon(int","tiley2lat(int","time","to_dense_features(array","to_sparse_features(array","topic","topkratesofi,","train","train_arow(list","train_arow_regr(array","train_arowe2_regr(array","train_arowe_regr(array","train_arowh(list","train_bprmf(int","train_classifier(list","train_cw(list","train_ffm(array","train_fm(array","train_gradient_tree_boosting_classifier(array","train_kpa(array","train_lda(array","train_mf_adagrad(int","train_mf_sgd(int","train_multiclass_arow(list","train_multiclass_arowh(list","train_multiclass_cw(list","train_multiclass_pa(list","train_multiclass
 
_pa1(list","train_multiclass_pa2(list","train_multiclass_perceptron(list","train_multiclass_scw(list","train_multiclass_scw2(list","train_multiclass_xgboost_classifier(string[]","train_pa(list","train_pa1(list","train_pa1_regr(array","train_pa1a_regr(array","train_pa2(list","train_pa2_regr(array","train_pa2a_regr(array","train_perceptron(list","train_plsa(array","train_randomforest_classifier(array","train_randomforest_regression(array","train_regressor(list","train_scw(list","train_scw2(list","train_slim(","train_xgboost_classifier(string[]","train_xgboost_regr(string[]","transform","tree","tree_export(str","tree_predict(str","true","truncate])","tupl","two","type","udfs.","undergo","url","us","usage:","useindexasprefix])","user,","userid,","v1,","v2,","valu","value)","value,","values,","var_importance,","variabl","vector","vector)","vectorhav","vectorize_features(array","version","vifj,","vjf,","vjfi,","voted_avg(doubl","w0,","w1,","w2,","w3)","weight","weight,","weight_voted_avg(
 
expr)","wi,","wise","wj,","word","word)","word,","words[,","x","x)","x,","xgboost","xgboost_multiclass_predict(str","xgboost_predict(str","xh,","xi,","xj)","xk,","xtile(lon,zoom)","xtime","xtimes,","xxx;","y","y)","y)^2))","y,","yhat","ytile(lat,zoom)","y|)","y|^p)^(1/p)","zero","zoom","zoom)::bigint","zoom)::doubl","zoom)::int","zscore(value,","{int|string}","|"],"tips/":["(asf),","apach","effect","effort","foundat","hivemal","incub","incubator.","softwar","sponsor","tip","undergo"],"tips/addbias.html":["\"0\"","(\"","(0,0).","(1,1)","(2,2)","(asf),","(feature,weight)","(or","(select",")","1\"","_b","ad","add","add_bias()","addbias()","addbiasudf","alway","apach","avg(weight)","b,","becuas","befor","better","bia","both(important!)","cast(split(feature,\":\")[1]","claus","clause,","consid","creat","cross","data","dataset","default.","detail.","divid","e2006tfidf_pa1a_model","e2006tfidf_test","e2006tfidf_test_explod","e2006tfidf_train_x3","effort","enabl","examples.","exist","explici
 
t","explode(add_bias(features))","express","extract_feature(feature)","extract_weight(feature)","f(x)","f(x).","f(x)=wx+b","f(x)=y,","featur","feature,","feature;","float)","follow","follows.","form","found","foundat","function","group","hivemal","hivemall,","hyperplan","incub","incubator.","label","later","learn","make","model","note","origin","origin.","pa1a_regress(add_bias(features),target)","point","predict","regularization),","rowid,","see","select","softwar","split(feature,\":\")[0]","sponsor","t","tabl","target,","test","then,","train","trainer","training/test","undergo","us","v0.3)","v0.3.1","valu","vector.","view","w,","weight","without","x","y","y=f(x)=wx"],"tips/rand_amplify.html":["${shufflebuffersize}","${shufflebuffersize},","${xtimes}","(","(0.743392)","(0.746214)","(a","(asf),","(copy)","(e.g.,","(external)","(feature,weight)","(rowid,","(sec)","(select",")","*","*)","0.734805","0.743392","0.746214","1","100","116.424","2","2012,","3.","479.855","89.718","abov","acc
 
uraci","actual","algorithm","amplifi","amplifier+clust","amplify(${xtimes},","amplify()","apach","argument","articl","auc","avoid","becom","below:","better","bottleneck","bottleneck.","buffer","cast(avg(weight)","caus","claus","cluster","conclus","converg","creat","cup","data,","deal","definit","descent)","distribut","each","effect","effici","effort","elaps","enumer","even","exampl","example)","example,","example.","examples,","execut","explain","factor","factor.in","feature,","feature;","features)","file","filled.","first","float)","follow","follows:","foundat","function","good","gradient","group","hdfs.","higher","hivemal","hivevar:shufflebuffersize=1000;","hivevar:xtimes=3;","however,","improv","in/out","incub","incubator.","input","instance.","instead","involv","iter","iterations.","job","job.","kdd","key","key.","known","label,","larg","learn","local","logress(features,label)","lr_model_x3","m/r","machin","mandatori","map","mapreduc","merg","method","models.","more","multipl","
 
need","note","oper","order","output","phase","plain","predict","problem","problem.","provid","queri","rand();","rand_amplifi","rand_amplify(${xtimes},","rand_amplify()","rand_amplify(),","random","randomli","reason","recommend","record","reduc","replac","requir","result","return","row","row.","score.","select","set","sever","show","shown","shuffl","shuffled.","similar","singl","slow","small","so,","softwar","sort!","spark","specifi","sponsor","stage","steps.","stochast","suit","t","tabl","task","task.","tasks,","techniqu","then,","through","time","time.","track","train","training_orcfil","training_orcfile;","training_x3","trainning_x3","udtf","undergo","us","user","variants.","veri","view","weight","within","without"],"tips/rt_prediction.html":["\"\\n\"","\"\\t\"","$sqoop_home/lib.","'\\n'","'\\t'","'a9a_model1_tsv'","'features'","'sqoop';","'sqoop'@'%'","'t'","(","(/etc/mysql/my.conf)","(0,1,10)","(0,1,10);","(0.00","(1.0","(asf),","(feature);","(i.e.,","(jdbc","(option","(rowid)",
 
"(t.featur",");","*","+","/","//","/user/hive/warehouse/a9a.db/a9a_model1_tsv","/user/hive/warehouse/a9a.db/a9atest_exploded_tsv","0","0.0","0.0)","0.05595205126313402","0.1310696931351625","0.21053194999694824","0.5,","0.5761121511459351","1","1.0","1.0).","1.0,","1.4.5","1.5259535312652588","10","10;","12427","12427;","12428","16","2.6.","3","3;","5","67","7","73","74","76","82","83",";","=",">","\\","a9a","a9a.*","a9a;","a9a_model1","a9a_model1;","a9a_model1_feature_index","a9a_model1_tsv","a9a_model1_tsv;","a9atest","a9atest_explod","a9atest_exploded_rowid_index","a9atest_exploded_tsv","a9atest_exploded_tsv;","abov","access","achiev","add","alreadi","alternatively,","apach","article,","assum","batch","be","begin","better","bigint,","bin/sqoop","binari","bind_address","boost","btree;","build","build.xml","carri","categor","check","classif","column","configur","connect","connector","creat","data","databas","dbms.","defin","delimit","desc","dir","directori","do","doubl","double)","
 
driver)","drop","each","edit","effort","end;","entri","exist","exp(","explain","explode(add_bias(features))","export","exported.","extend","extract_feature(feature)","extract_weight(feature)","featur","feature,","feature;","field","file","find","finishes,","flush","follows:","forget","format","foundat","function","grant","hadoop","hadoop.","hadoop_common_home=${hadoop_home}","hadoop_conf_dir=${hadoop_home}/etc/hadoop/","hadoop_home=/opt/hadoop","have","hdf","here","hive","hive,","hive.","hivemal","however,","id","identifi","if(sigmoid(sum(t.valu","import","incub","incubator.","index","input","int,","itself","ivy.xml","java.jar","jdbc:mysql://${mysql_host}/a9a","join","label,","languag","later","learn","left","limit","line","list","locat","location:hdfs://dm01:9000/user/hive/warehouse/a9a.db/a9a_model1_tsv","location:hdfs://dm01:9000/user/hive/warehouse/a9a.db/a9atest_exploded_tsv,","logist","lookup","m","m.featur","m.feature)","m.weight))","master","model","mysql","mysql.","mysql>",
 
"mysql_host=dm01","need","node","onlin","online/r","online/realtim","outer","packag","particular","password","patch.","predict","prediction.","prepar","prerequisit","privileg","privileges;","prob","prob,","probabl","process","process;","provid","put","query.","rdbm","read","real","recommend","regress","relat","return","row","rowid","rowid,","rowids.","run","scheme","sec)","select","server","set","shown","sigmoid","sigmoid(sum(m.weight))","sigmoid(sum(t.valu","sigmoid(x","sigmoid;","similar","simpli","slave","so,","softwar","sponsor","sql","sqoop","sqoop.","step)","store","successfulli","support","t","t.rowid","tabl","table,","tables.","target","task.","termin","test","textfil","then,","time","transact","tsv","undergo","uniqu","us","user","usernam","v2.6.0.","valu","view","way","weight","x));","|"],"tips/ensemble_learning.html":["(","(asf),","(label,feature,weight)","(label,feature,weight,covar)","(select","(t.featur","(t.rowid",")","*","/home/myui/tmp/defin","/home/myui/tmp/hivemall
 
.jar;","0.8474830954169797","0.8482344102178813","0.8494866015527173","0.8499874780866516","0.850488354620586","1;",":","=","==","[case1]","[case2]","accuraci","actual","actual,","add","algorithm","all.hive;","apach","argmin_kld(feature,","arow","better","broth","case","cast(featur","clean","cnt","cook","count(1)","count(1)/3993","covar)","creat","cw","default","delet","drop","effort","ensembl","ensemble(model)","ensemble(prediction)","ensemble/mix","evalu","exampl","explain","feature,","feature;","foundat","group","head","hive.exec.parallel.thread.number=8;","hive.exec.parallel=false;","hive.exec.parallel=true;","hivemal","hivemall.two","incub","incubator.","int)","jar","join","label","label)","label,","later","learn","learning.","left","let'","m","m.col0","m.col1","m.feature)","m.label","m.label,","mani","mapred.reduce.tasks=","mapred.reduce.tasks=4;","maxrow(cnt,","maxrow(score,","model","news20mc_arow_predict1","news20mc_cw_predict1","news20mc_ensemble_model1","news20mc_ensemble
 
_model1;","news20mc_ensemble_predict1","news20mc_ensemble_predict1;","news20mc_ensemble_submit1","news20mc_ensemble_submit1;","news20mc_pred_ensemble_predict1","news20mc_pred_ensemble_submit1","news20mc_scw2_predict1","news20mc_test","news20mc_test_explod","news20mc_train_x3","one?","outer","pd","pd.label","pd.rowid);","predict","predicted;","prepar","replac","reset","rowid","rowid,","run","score","score,","scw2","select","set","softwar","sourc","spoil","sponsor","stabl","sum(m.weight","t","t.label","t.rowid,","t.value)","t1","t2","t2;","t3;","tabl","train","train_multiclass_arow(add_bias(features),label)","train_multiclass_cw(add_bias(features),label)","train_multiclass_scw(add_bias(features),label)","udf","undergo","unfortunately,","union","v0.1","v0.2","verifi","view","voted_avg(weight)","weight"],"tips/mixserver.html":["\"","#","(3","(asf),","(feature,weight)","(mix","(netty,jsr305)","(select","(w/","(w/o",")","./run_mixserv.sh","0.844835019263103","0.8678096499719774","11212","
 
32","5","abov","access","accuraci","ad","apach","assum","asynchron","better","bin/run_mixserv.sh","block","brief","cast(voted_avg(weight)","caution:","certain","classifiers.","cluster","commun","configur","contain","converg","creat","current","dataset.","default","dependencies.jar","design","detail","due","effect","effici","effort","enabl","enough","exampl","experience,","explain","explan","fast","faster","feature,","feature;","file","find","first,","float)","follow","follows:","foundat","furthermore,","gbe","group","hadoop","handl","hive.","hivemal","hivemall.","horizont","host01,","host01,host02,host03\")","host03","host03.","i/o.","improv","incub","incubator.","instal","installation.","intern","jar","kdd10a_pa1_model1","kdd10a_train_x3","kdd2010;","kdd2010a","larg","later","make","minimum","mix","mix\"","mix)","mix).","mixing.","mixserv.jar","mixserver.java","model","multipl","neglig","networking.","node","nodes.","nodes:","non","normal","now,","option","options.","overhead","pa1
 
","page,","perform","port","port\"","predict","prerequisit","protocol","put","query.","recommend","requir","run","run_mixserv.sh.","scalabl","see","seen","select","server","server(s)","server)","servers.","set","simpl","size","size).","slide.","softwar","sponsor","standard","sure","t","tabl","target/hivemal","though.","through","throughput","thu","time","train","train_pa1(add_bias(features),label,\"","undergo","us","v0.3","weight","worker"],"tips/emr.html":["\"","\",\"","\"hive","\"hivemal","\"instal","\"instance.ismaster=true,s3://${s3bucket}/emr/conf/emr_hivemall_bootstrap.sh\"","\"instance.ismaster=true,s3://mybucket/emr/conf/emr_hivemall_bootstrap.sh\"","${s3bucket}/datasets/news20b/[train|test].","${s3bucket}/emr/conf","${s3bucket}/emr/log","${s3bucket}/emr/output","'\\n'","'\\t'","'s3://${s3bucket}/emr/outputs/news20b_arow_model1';","'s3n://${s3bucket}/datasets/news20b/test';","'s3n://${s3bucket}/datasets/news20b/train';","(","(arow)","(asf),","(emr).http://docs.aws.amazon.com
 
/elasticmapreduce/latest/developerguide/emr","(feature,weight)","(rowid,","(select","(t.featur","(t.rowid",")","*","*)","./elast","./tmp/defin","./tmp/hivemall.jar;","0.0","0.175","0.35","0.7","0.9659727782225781","1","100","1000,","1a","2","3","3.0.0\".","8","=","==",">","\\","action","actions/configur","actions/instal","actions/run","actual","actual,","adapt","add","aliv","all.hive;","amazon","ami","amplify(3,","ap","apach","arg","array","avail","befor","best","bid","bootstrap","both","c,fs.s3n.multipart.uploads.enable=true,","c,fs.s3n.multipart.uploads.split.size=67108864\"","case","cast(rand(47)","cast(rand(49)","cast(rand(50)","cast(split(feature,\":\")[0]","cast(split(feature,\":\")[1]","cast(voted_avg(weight)","cheap","clean","cli","client","cluster","cluster\"","collect","core","core/task","count","count(1)/4996","creat","data","databas","debug","default","delimit","drop","e.g.,","effort","elast","emr","emr_hivemall_bootstrap.sh","enabl","end","evalu","exist","explode(add_bi
 
as(features))","extern","featur","feature,","feature;","features)","field","float","float)","follows.","follows:","format","foundat","ganglia","ganglia\"","group","gui","hadoop","hadoop,","hive","hive.html","hivemal","hivevar:s3bucket=your_bucket_name;","i'm","incub","incubator.","input","insert","instanc","instead","int)","int),","int);","int,","interact","item","jar","job","job,","join","label","label,","larg","later","latest","launch","learn","left","line","locat","log","lunch","m","m,mapred.child.java.opts=","m,mapred.tasktracker.map.tasks.maximum=7,","m,mapred.tasktracker.reduce.tasks.maximum=2,","m.feature)","m1.larg","m1.medium","m1.xlarg","mapred.max.split.size=67108864;","mapreduc","master","mode.","money.","name","news20;","news20b_arow_model1","news20b_arow_model1;","news20b_arow_predict1","news20b_arow_predict1;","news20b_arow_submit1","news20b_arow_submit1;","news20b_test","news20b_test_explod","news20b_train","news20b_train;","news20b_train_x3","northeast","old","optio
 
nally,","or,","outer","output","overwrit","pd","pd.label","pd.rowid);","predict","predicted;","prepar","prerequisit","price","put","rand_amplify(3,","recommend","regular","replac","row","rowid","rowid,","run","s3,","s3://elasticmapreduce/bootstrap","s3://mybucket/emr/log","s3n://${s3bucket}/emr/log","save","select","set","setup\"","site.xml","site=s3://${s3bucket}/emr/conf/h","size","softwar","sourc","specifi","split","sponsor","spot","store","string,","sum(m.weight","t","t.label","t.rowid,","t.rowid;","t.value)","tabl","task","termin","test","textfil","then,","through","tip","total_weight,","train","train_arow(add_bias(features),label)","tsv","type","undergo","uri","us","user","usual","valu","vector","version","view","way","weight","wizard.","work","xmx1536m,","yarn","yarn.","zone"],"tips/general_tips.html":["(asf),","apach","effort","foundat","gener","hive/hadoop","hivemal","incub","incubator.","softwar","sponsor","tip","undergo"],"tips/rowid.html":["${sequence_number}","${task_id
 
}","'","'')","',","()","(asf),","*","..;","a9atest;","ad","also,","anoth","apach","becom","creat","dataset","each","effort","execut","foundat","function","gener","hivemal","however,","incub","incubator.","larg","later.","long","option","over","provid","queri","rc.1","reducer.","regexp_replace(reflect('java.util.uuid','randomuuid'),","return","row","row_number()","row_number().","rowid","rowid()","rowid,","rownum()","scheme","select","singl","slow","softwar","sponsor","sprintf(`%d%04d`,sequence,taskid)","sql","string","support","tabl","undergo","uniqu","us","v0.2","v0.5","xxx","xxx;"],"tips/hadoop_tuning.html":["\"","(1","(2^24","(asf),","(assum","(e.g.,","(float)","(heuristics)","(iff","(mr","(short)","(use","(yarn)","*","0.5","0.6)","1.2","1024mb","161mb","2","2048","2048mb","2^24","2^25","2^25)","4","820","820mb","=","abov","amplify()).","apach","avail","byte","calculated)","case.","chang","compon","configur","consum","covari","default)","default.","dens","densemodel\"","effort","
 
engin","estim","execut","feature_dimens","follow","follows:","formula","foundat","guid","hadoop","hash","here","hive","hive.execution.engine=mr;","hive.execution.engine=tez;","hivemal","hivemall.","http://hadoopbook.com/","http://www.slideshare.net/cloudera/mr","import","incub","incubator.","io.sort.mb=1024","larg","make","mapper","mapper.","mapred.job.reduce.input.buffer.percent=0.2","mapred.map.child.java.opts=\"","mapred.reduce.child.java.opts=\"","mapred.reduce.shuffle.input.buffer.percent=0.6","mapreduc","mapreduce.framework.name=yarn","mapreduce.framework.name=yarn;","mapreduce.map.java.opt","mapreduce.map.java.opts=\"","mapreduce.reduce.input.buffer.percent)","mapreduce.reduce.input.buffer.percent=0.2","mapreduce.reduce.java.opt","mapreduce.reduce.java.opts=\"","mapreduce.reduce.shuffle.input.buffer.percent=0.6","mapreduce.task.io.sort.mb","mapreduce.task.io.sort.mb=1024","max","mb","memori","model","model,","model.","moreover,","note:","old","option","perf","plain","pleas","
 
possible.","predict","prerequisit","queries.","rand_amplify()).","recommend","reduc","reducer.","refer","represent","run","set","setting:","side","so,","softwar","spaceefficientdensemodel","spaces.","spars","sponsor","table)","tez","tez;","train","tune","tuning:","undergo","us","used,","v1)","xmx2048m","xx:+printgcdetails\"","≈"],"troubleshooting/":["(asf),","apach","effort","foundat","hivemal","incub","incubator.","softwar","sponsor","troubleshoot","undergo"],"troubleshooting/oom.html":["(a","(asf),","(mapred.child.java.opts/mapred.map.child.java.opts)","amplify(),","apach","befor","caus","certain","cloud","default","due","dure","each","effort","error","exampl","first","fit","foundat","hadoop","happen","hivemal","hivemall.","increases)","incub","incubator.","input","instead.","larg","larger","mapper","mapred.max.split.s","mapred.max.split.size=67108864;","mapred.reduce.task","mapred.reduce.tasks=64;","memory.","merg","middl","model","number","oom","outofmemoryerror","parameters."
 
,"possible.","rand_amplify()","reduc","revis","set","setting,","shuffle/merg","shuffle/reduc","size","smaller","softwar","split","sponsor","step,","still","that,","then,","train","trainer","training.","tri","undergo","us","valu"],"troubleshooting/mapjoin_task_error.html":["(asf),","0.11.0,","apach","auto","befor","complex","convers","default.","disabl","effort","enabl","error:","except","execut","follows.","foundat","gener","hive","hive.auto.convert.join","hive.auto.convert.join=false;","hivemal","incub","incubator.","join","map","object","object.","queri","semanticexcept","semanticexception,","serial","set","softwar","sometim","sponsor","task","throw","undergo","us","views,","workaround"],"troubleshooting/asterisk.html":["(asf),","4181","alia","alias,","apach","argument","asterisk","effort","explicitly.","fix","foundat","hive","hivemal","incub","incubator.","name","part","possibl","release.","see","softwar","specifi","sponsor","tabl","udtf","undergo","us","v0.12","without","work","
 
workaround","working."],"troubleshooting/num_mappers.html":["#","(asf),","(i.e.,","2.x","apach","block","configur","control","default","default.","effort","foundat","give","hadoop","hdfs)","hive.input.format","hive.input.format.","hive.input.format=org.apache.hadoop.hive.ql.io.hiveinputformat;","hive.tez.input.format;","hive.tez.input.format=org.apache.hadoop.hive.ql.io.hiveinputformat","hivemal","incub","incubator.","input","less","mapper","mapreduce.job.maps=128;","maximum","note","number","org.apache.hadoop.hive.ql.io.combinehiveinputformat.","org.apache.hadoop.hive.ql.io.hiveinputformat","set","setting:","size","softwar","split","sponsor","table.","tez","tri","undergo","us","via"],"troubleshooting/mapjoin_classcastex.html":["(asf),","1.3.0.","[workaround]","apach","array","caus","caution:","classcastexcept","column(s).","contain","detail.","effort","fix","follows:","foundat","hive","hive.mapjoin.optimized.hasht","hive.mapjoin.optimized.hashtable=false;","hive_11051","hivemal","i
 
ncub","incubator.","join","map","refer","serial","set","side","softwar","sponsor","tabl","tez","tri","undergo"],"misc/generic_funcs.html":["\"456\",","\"a\",\"b\",\"c\"","\"age\"","\"age\",","\"apple\"","\"city\",","\"eight\",","\"five\",","\"four\",","\"japan\",","\"john\",","\"makoto\"","\"name\"","\"nine\",","\"one\"","\"one\",","\"osaka\")","\"person\"","\"seven\",","\"six\")","\"six\",","\"ten\"),","\"three\")","\"three\",","\"tokyo\")","\"tokyo\"),","\"two\"","\"two\",","&lt;=","'","');","'[0.1,1.1,2.2]',","'age')","'apple'","'array'","'array')","'array>'),","'banana'","'candy'","'donut'","'egg'","'map')","'price","'struct',","'ti,si,i,bi'","'{","(","(1.0","(alphabetically)","(asf),","(banana","(banana,","(default),","(matrix0.#cols,","(natur","(natural)","(no","(or","(revers","(reverse)","(select","(tail","(top","(æ
 
ª)トンドルiii",")","),","),'array>'),","),'array>');",");","*)","+",",","..)","...","...)","/","0)","0,","0.0')","0.0);","0.0,","0.0f|1.0f","0.0f|1.0f,","04",
 
"1","1)","1),","1,","1,2,3","1,9]","1.0","1.5","10","10,","100'),","100)","100),","1|1","2","2'),","2)","2),","2);","2,","2,1,3,10]","2,10));","2,4),","2.0","20","2018","21","22","23","3","3)","3),","3);","3,","3.0","31)","31),","3600,","37","4","4));","4,","4.0","4]","5","5.0","5]","6","6,","6.0","7","789,","9223372036854775808]",":","=",">","[","[\"aaa\"]","[\"eight\",\"nine\",\"ten\"]","[\"eight\",\"nine\"]","[\"machine\",\"machin","[\"six\",\"seven\",\"eight\",\"nine\",\"ten\"]","[\"six\",\"seven\",\"eight\"]","[\"zero\",\"one\"]","[,","[0.1,1.1,2.2]","[1,2,3,4,5,6,7,8]","[1,2,3,4]","[1,2,3,5]","[1,2,3]","[1,2]","[14,","[2,","[2,3,4]","[2.0,4.0,6.0]","[3,4]","[3.0,5.0,7.0]","[3]","[5,","[apple,","[donut,","[egg,","[{\"city\":\"tokyo\"},{\"city\":\"osaka\"}]","[{\"country\":\"japan\",\"city\":\"tokyo\"},{\"country\":\"japan\",\"city\":\"osaka\"}]","[{\"key\":\"one\",\"value\":1},{\"key\":\"two\",\"value\":2}]","aa+=kaim|wtt!+wbgaa","aaaaaaaaaaaaaaaabbbbccc","accord","add","aggreg
 
","apach","append","apple]","argument","arr","arr,","array","array(","array(\"four\",","array(\"one\",","array(\"zero\",","array('age')","array('city')","array('name',","array('person')","array('ti','si','i','bi')","array()","array(2,","array(314,007))","array(314,007)),","array(true,","array,","array2,","array>,","array_append(array","array_append(array('a','b'),'c');","array_append(array(1,2),3);","array_avg(array)","array_concat(array","array_concat(array(1),array(2,3));","array_flatten(array(array(1,2,3),array(4,5),array(6,7,8)));","array_flatten(array>)","array_intersect(array","array_intersect(array(1,3,4),array(2,3,4),array(3,5));","array_remove(array","array_remove(array(\"aaa\",\"bbb\"),\"bbb\");","array_remove(array(1,null,3),array(null));","array_slice(","array_slice(array","array_slice(array(1,2,3,4,5,6),","array_sum(array)","array_to_str(array","array_to_str(array(1,2,3),'","array_union(array(1,2),array(1,2));","array_union(array(1,2),array(2,3),array(2,5));","array_uni
 
on(array1,","array|const","assert(boolean","assert(pric","averag","b1,","b2,","banana),","base91","base91(binari","base91(deflate('aaaaaaaaaaaaaaaabbbbccc'));","bin)","binari","bits_collect(int|long","bits_or(array","bitset","bitset)","boolean","c","c1,","c2,","candy,","candy]","cast","check","cmpkey,","column","columnnames])","compress","compresseddata)","compressionlevel])","concaten","condit","condition)","condition,","conditional_emit(","conditional_emit(array","conditions,","const","contain","convert","convert_label(const","count(1)","data","date_add(current_date(),value),valu","datetim","decompress","default_valu","deflate(text","deflater.","desc","describ","dimens","distcache_gets(filepath,","distribut","donut]","dot","dot(matrix0.t,","doubl","dunut]","duplic","each","each_top_k(int","effort","egg","egg)]","egg,","elem)","element","element_at(array","element_at(array(1,2,3,4),","element_at(array(1,2,3,4),0);","elimin","emit","end","end)","end.","english","englishtext","entri"
 
,"entry.","errmsg)","error","exist","exp(","expect","explicitli","explode(array(1.0,2.0,3.0,4.0,5.0,6.0,7.0))","fails.","false),","false,","featur","features)","filter","filteringkeys)","first","first_element(array('a','b','c'));","first_element(array());","first_element(x)","five","flattened.","float)","float_array(ndims)","form","form.","form])","foundat","four","from_json(","from_json(str","from_json(to_json(","fun!',","fun\",\"fun\"]","func(boolean","func(str","function","functions.","gener","generate_ser","generate_series(1,3))","generate_series(2,4);","generate_series(4,3);","generate_series(5,1,","generate_series(c1,","generate_series(const","give","given","gram","group,","have","hive","hiveexcept","hivemal","id","importance,","incub","incubator.","index","indexes)","inflat","inflate(binari","inflate(unbase91(base91(deflate('aaaaaaaaaaaaaaaabbbbccc'))));","input","input;","int","intersect","int|bigint","int|const","int|text","int|text|array","invalid","ip_addr","ip_addr)","ip
 
_addr,","ipaddr","is\",\"is\",\"i","is_stopword(str","itself","jobconf","jobconf_gets()","jobid()","json","jsonstring,","k","k)","k,","key","key)","key),","key,","keys)","k|const","l2","l2_norm(doubl","last","last_element(array('a','b','c'));","last_element(x)","learn","learning\",\"learning\",\"learn","length","length])","less","level","list","list,","logic","long","long[]","machin","map","map('a',10,'b',20,'c',30)","map,","map_exclude_keys(map","map_exclude_keys(map(1,'one',2,'two',3,'three'),array(2,3));","map_get_sum(map","map_include_keys(map","map_include_keys(map(1,'one',2,'two',3,'three'),array(2,3));","map_index(a,","map_index(map(\"one\",1,\"two\",2),key)","map_key_values(map(\"one\",1,\"two\",2));","map_key_values(map)","map_tail_n(map","mapred.job.id","mapred.task.partit","mapreduc","maps.","map|value_typ","math","matrix","matrix0_row,","matrix1)","matrix1.#cols)","matrix1_row)","maxsiz","maxsize])","mean","merge_maps(m)","merge_maps(x)","met","minsiz","minsize,","more",
 
"move","moving_avg(numb","moving_avg(x,","msg)","n","n)","named_struct(\"country\",","named_struct(\"name\",","ndim","nfc","nfd,","nfkc,","nfkd","norm","normal","normalize_unicode('㈱㌧㌦â
…²','nfkc');","normalize_unicode('ハンカクカナ
','nfkc');","normalize_unicode(str","note","null","null,","number","object","object.","offset","on","operation.","options])","order","order)","origin","original,","other","output","page","pairs.","parameters.","parsekey])","perform","pos)","posit","postgresql'","price","price,","primit","process","product.","product_id,","pseudo","queri","raise_error('found","raise_error()","rang","record')","regex])","relat","remov","replac","represent","retriev","return","return)","returntyp","reverse'),","reverseorder=false])","row","rowid()","rownum()","rownum,","saniti","see","select","select_k_best(array","sep=','])","sequenc","seri","series;","session.select","session_id,","sessionize(long","sessionize(time,","set","shape","sigmoid(x)","similar","singula
 
r","singularize(lower(\"apples\"));","singularize(str","slice","softwar","sort","sort_and_uniq_array(array(3,1,1,","sort_and_uniq_array(array)","specif","specifi","sperat","split","split_words(str","sponsor","sprintf(%d%04d,sequence,taskid)","src","src,","start","start,","step","step)","stock_pric","stopword","str","string","struct(\"123\",","subarray_endwith(array","subarray_endwith(array(1,2,3,4),","subarray_startwith(array","subarray_startwith(array(1,2,3,4),","subject])","sum","t","t1","t;","tail","take","target","target)","taskid()","text","th","three","thresholdinsec","throw","time","time,","timeinsec,","timeseri","tmp","tmp;","to_bits(array(1,2,3,128));","to_bits(int[]","to_json(","to_json(ani","to_map(key,","to_ordered_list(key)","to_ordered_list(key,","to_ordered_list(primit","to_ordered_list(value,","to_ordered_map(key,","to_string_array(array)","token","tokenize(str","tolowercase])","top","transform","transpose_and_dot(array","true)","true),","true,","try_cast(ani","try_c
 
ast(array(1.0,2.0,3.0),","try_cast(map('a',10,'b',20,'c',30),","two","type.","typename)","unbase91(string)","unbits(bits_or(to_bits(array(1,4)),to_bits(array(2,3))));","unbits(long[]","unbits(to_bits(array(1,4,2,3)));","undergo","union","up","us","uuid","valu","value)","value),","value,","values,","variou","vector","vector_add(array","vector_add(array(1.0,2.0,3.0),","vector_dot(array","vector_dot(array(1.0,2.0,3.0),2);","vector_dot(array(1.0,2.0,3.0),array(2.0,3.0,4.0));","weblog","whether","windowselect","windowsize)","word","word)","word_ngrams(array","word_ngrams(tokenize('machin","words,","x)","x))","x,","x1,","x2,","x_rank(key)","xi)","xxx","y)","{","{\"age\":31}","{\"city\":\"tokyo\"}","{\"col1\":\"123\",\"col2\":\"456\",\"col3\":789,\"col4\":[314,7]}","{\"country\":\"japan\",\"city\":\"tokyo\"}","{\"name\":\"john\",\"age\":31}","{\"name\":\"makoto\",\"age\":37}","{\"ti\":\"123\",\"si\":\"456\",\"i\":789,\"bi\":[314,7]}","{10:\"apple\",4:\"candy\",3:\"banana\"}","{10:\"apple\"
 
,4:\"candy\"}","{10:\"apple\"}","{1:\"one\"}","{2:\"two\",3:\"three\"}","{3:\"banana\",4:\"candy\",10:\"apple\"}","{3:\"banana\",4:\"candy\"}","{3:\"banana\"}","{sequence_number}","{task_id}","{}","|","}","}',","ハンカクカナ"],"misc/topk.html":["${k},","'","(","(asf),","(e.g.,","(int","(partit","(rank,",")","),","*","..","..,","...,","0","0,","0.2","0.4","0.4383084177970886","0.43862903118133545","0.4398220181465149","0.44030147790908813","0.4408798813819885","0.44112563133239746","0.4415401816368103","0.44166821241378784","0.4422193765640259","0.4424300789833069","0.44254064559936523","0.44283604621887207","0.4429032802581787","0.4432108402252197","0.44323229789733887","0.4435907006263733","0.4442034363746643","0.44569307565689087","0.4460843801498413","0.4464914798736572","0.45163780450820923","0.45244503021240234","0.4525672197341919","0.4527127146720886","0.45314133167266846","0.6","0.8","0.8205751180648804","0.822281539440155","0.8241575956344604","0.8255619406700134","0.
 
8271955251693726","0.8301891088485718","0.8328862190246582","0.8340602517127991","0.8344510793685913","0.8390793800354004","0.8438876867294312","0.8439178466796875","0.8463355302810669","0.8467264771461487","0.8499397039413452","0.8516314029693604","0.8562054634094238","0.856602132320404","0.8585299849510193","0.8594650626182556","0.9480557441711426","0.9493276476860046","0.9531533122062683","0.9536819458007812","0.9761330485343933","1","1,","10","10')","10').","10)","10,","100),","10143","10242","10514","10922","10;","11073","11719","12","14073","15173","17218","17582","17782","18541","18556","19468","2","2,","20400","21009","21115","21125","21595","21657","22006","22853","23150","23386","24289","24413","25","2513","25141","25364","25977","26220","27121","3","34","3786","4","5","50","6","60","6598","7","70","7041","7326","7503","8","80","8018","8477","8697","9","90","900","9008","943","9881","=","`each_top_k`","accept","addit","aggreg","altern","alway","amount","angular_similarity(
 
features1,","angular_similarity(t2.features,","apach","appli","approach","arg1,","arg2,","argn)","argn).","argn.","argument","as:","asc,","assum","avoid","b","base_id","base_id,","behav","benef","by)","case","cases.","caution","cautioneach_top_k","cautionin","certain","class","class,","claus","click","clicks,","cluster","collect_list(value)","column","compar","comparison.","complex","comput","consid","consist","cost","creat","cross","crucial","data.","dense_rank","desc)","desc;","differ","distribut","doubl","duplic","each","each_top_k","each_top_k(","each_top_k(${k},","each_top_k(int","each_top_k,","each_top_k.","effici","efficiently.","effort","element","ensur","environ","explicit","explode(m)","extens","fast","featur","features1,","features2),","features2,","follow","follows:","foundat","function","get","group","group,","group.","hanld","help","hive","hive.","hivemal","hivevar:k=","hivevar:k=10;","hivevar:k=5;","http://stackoverflow.com/questions/9390698/h","id","id)","id,","id1",
 
"id1,","id2,","if(valu","incub","incubator.","input","instead","instead.","interact","involv","item","join","k","k,","k.","key","key,","larg","large.","later","later.","left","length","less","limit","list","long","m","mandatori","mani","map.","mapper","massiv","method","mytabl","n","neighbor_id","neighbor_id,","note","noteclust","null","null,","null.","number","o(nm).","or,","order","other_id,","outer","output","over","page","parallel","particularli","process","pseudo","queri","query/32559050#32559050","rand(31)","rank","rank()","rank,","rank/distribut","record","reduc","relat","repres","requir","result","result:","return","revers","rnd","rnd,","run","s01","s02","s03","s04","s05","s05;","same","scheme","score","score,","select","semant","set","shuffling,","side","signatur","similar","similarity,","similarity/dist","similarli","slightli","softwar","sort","sponsor","sql","sql'","standard","student","student)","student,","support","suppos","synonym","t","t01","t02","t03","t04","t05","t
 
1","t1.featur","t1.features),","t1.i","t1.id","t1.id,","t1;","t2","t2.featur","t2.id","t2.id,","t;","tabl","tail","take","test","test_hivemal","test_rnd","that.","then,","third","timestamp","to_ordered_list","to_ordered_list(value,","to_ordered_map","to_ordered_map(key,","top","top/tail","topk","train_hivemal","type","udtf","undergo","union","uniqu","us","usag","user","util","v0.3.2","valu","value)","value,","value.","variabl","veri","view","way","whre","window","x","y","y)"],"misc/tokenizer.html":["\"https://raw.githubusercontent.com/atilika/kuromoji/909fd6b32bf4e9dc86b7599de5c9b50ca8f004a1/kuromoji","\"kuromoji\"","\"normal\",","\"分かち書き\"","\"日本経済新聞,日本","\"関西国際空港,関西",";(a","(asf),","));","/path/to/defin","/path/to/hivemal","0,","2,","=","[\"kuromoji\",\"使う\",\"分かち書き\",\"テスト\",\"第\",\"二\",\"引数\",\"normal\",\"search\",\"extended\",\"指定\",\"デフォルト\",\"normal\",\"モード\"]","[\"を\",\"使う\",\"た\
 
",\"の\",\"テスト\",\"です\"]","[\"日本\",\"経済\",\"新聞\",\"関西\",\"国際\",\"空港\"]","[smartcn,","add","addition,","additional.hive;","all,","allow","amazon","apach","apach,","apis,","argument","array","array(","array(\"kuromoji\"),","array(\"名詞","basic","boolean","chines","const","core/src/test/resources/userdict.txt\");","custom","ddl","default","defin","dependencies.jar.","dependencies.jar;","detail","dictionari","each","effort","enabl","english","example,","explicitli","extern","false)","fifth","file","file,","first","follow","follows.","follows:","format:","foundat","fourth","hivemal","ictcla,","ignor","includ","incub","incubator.","indic","input,","issu","japanes","japaneseanalyz","jar","java,","javadoc","kuromoji","kuromoji'","kuromoji.","larg","later.","line,","list","mode","modul","module.","moreover,","need","nlp","non","note","notetokenize_ja","noun","null","null,","offici","option","pass","pleas","provid","queri","rc.1","refer","regist","respect
 
","s3:","select","signatur","simpl","simpli","smartchineseanalyz","smartchineseanalyzer.","softwar","somewher","sourc","sponsor","stop","stoptags,","stopwords)","stopwords,","string","support","syntax:","tag):","tags.","text","third","token","tokenize(text","tokenize_cn(\"smartcn为apache2.0协议的开源中文分词系统,java语言编写,修改的中科院计算所ictclas分词系统。\");","tokenize_cn(str","tokenize_ja(\"kuromojiを使った分かち書きのテストです。\",","tokenize_ja(\"kuromojiを使った分かち書きのテストです。第二引数にはnormal/search/extendedを指定できます。デフォルトではnormalモードです。\");","tokenize_ja(\"日本経済新聞&関西国際空港\",","tokenize_ja(text","tolowercas","udf","undergo","url","us","usag","user","userdict","userdict)","userdicturl","v0.4.1,","v0.5","well.","word","word)","xxx","クウコウ,テスト名詞\"","ケイザイ","コクサイ","シンブン,カスタãƒ
 åè©ž\",",
 
"一般\"));","中文,","中科院,","为,","修改,","分词,","协议,","国際","开源,","所,","新聞,ニホン","的,","空港,カンサイ","系统,","系统]","経済","编写,","计算,","语言,"],"misc/approx.html":["'","(asf),","14')","15","15')","16')","24')","25","25')","38033066","4')","45051015","45567770","45614484","45831359","45832280","45840617","49332600","6","6')","[","[4,32]","[4,sp]","]","`p`","`sp`","accur","actual","actual,","aggreg","algorithm","apach","approx_count_distinct","approx_count_distinct(rowid)","approx_count_distinct(rowid,","approx_count_distinct.","approxim","better","cardin","caus","consumpt","control","count","count(distinct","data","defaul","default","default_p","distinct","effici","effort","element","error","exhaust","expect","expression),","find","follows:","foundat","function","gener","help","help')","help]","hivemal","hllevalu","huge","hyperloglog","hyperloglog++","implement","incub","incubator.","inform","input","input.","large.","le
 
ss","memori","more","multiset.","normal","notep","number","option","p","p14","p14,","p15","p15,","p15_sp15","p16","p16,","p24","p24,","p25","p25,","p4","p4,","p6_sp6","p6_sp6,","p=15","paper.","perform","precis","rang","regist","rowid)","select","set.","show","signatur","size","softwar","sp","spars","sponsor","tradeoff","train;","undergo","us","usag","usage:","valu","value)","well.","work"],"ft_engineering/scaling.html":["\":\",","\"age\"","\"balance\"","\"campaign\"","\"day\"","\"duration\"","\"pdays\"","\"previous\"","${max_target})","${mean_target},","${min_target},","${stddev_target})","'banana:0.5'))","(","(asf),","(t1.featur",")","),","...","0,","0.51940954","0.51940954;","0.6278076335455348","1","1,","2","3","3.566241460963296","3.566241460963296;","3;","7.899578","7.899578;",";","=","[\"apple:0.6666667\",\"banana:0.33333334\"]","[\"apple:0.8944272\",\"banana:0.4472136\"]","[\"reflectance:0.5252967\",\"specific_heat:0.19863537\",\"weight:0.0\"]","[\"reflectance:0.5950446\",\"
 
specific_heat:0.09166764\",\"weight:0.052084323\"]","[\"reflectance:0.6797837\",\"specific_heat:0.12567581\",\"weight:0.13255163\"]","[\"weight:69.613\",\"specific_heat:129.07\",\"reflectance:52.111\"]","[\"weight:70.67\",\"specific_heat:128.161\",\"reflectance:52.446\"]","[\"weight:72.303\",\"specific_heat:128.45\",\"reflectance:52.853\"]","ag","apach","appli","avg(target),","avg(value)","balanc","befor","both","campaign","collect_list(","collect_list(feature)","complex","concat(feature,","creat","data.","day","durat","e2006tfidf_test","e2006tfidf_train","e2006tfidf_train;","e2006tfidf_train_sc","each","effort","ensur","explod","explode(features)","extract_feature(feature)","extract_weight(feature)","fals","featur","feature(","feature(feature,","feature,","follow","follows:","foundat","fv","group","hivemal","hivevar:max_target=","hivevar:mean_target=","hivevar:min_target=","hivevar:stddev_target=0.6278076335455348;","http://en.wikipedia.org/wiki/feature_scaling#resc","http://en.wik
 
ipedia.org/wiki/standard_scor","id,","if(pday","if(t1.minmax,rescale(t1.value,","incub","incubator.","join","l1","l1/l2","l1_normalize(array('apple:1.0',","l2","l2_normalize(array('apple:1.0',","later","length:","limit","max","max(target)","max(value)","mean,","min","min(target),","min(value)","min,","minmax","minmax)","minmax,","more","norm","norm_fv","normal","pdays)","previou","quant","quantative_norm","quantative_stat","replac","rescale(t1.value,","rescale(target,","rowid","rowid,","scale","select","set","softwar","sponsor","stat","stddev","stddev,","stddev_pop(target)","stddev_pop(value)","t1","t1.feature,","t1.id","t1.id,","t2","t2.feature)","t2.max)","t2.max),zscore(t1.value,","t2.mean,","t2.min,","t2.stddev)","t2.stddev))","t;","tabl","target","target,","tip","train","train_norm","true","undergo","union","unit","us","v0.3.2","valu","vector","view","zscore","zscore(t1.value,","zscore(target,","zscore)"],"ft_engineering/hashing.html":["\"movieid#2331\"));","(2^24).","(2^24)]",
 
"(a.k.a.","(asf),","(it'","(or","+1'd","0","1","1.","10');","16777216","16777217","2","2746618","2;","3');","3874068","4063537","9566153","[","[\"11293631\",\"3322224\",\"4331412\"]","[\"11293631:0.1\",\"3322224:0.2\",\"4331412:0.3\"]","[\"1803454\",\"6630176\"]","[\"1828616\",\"6238429\"]","[\"1828616:3.3\",\"6238429:4.999\",\"6238429\"]","[\"4063537\",\"8459207\"]","[\"4063537:1.0\",\"4063537\",\"8459207:2.0\"]","[\"7\",\"1\"]","[\"userid#4505\",\"movieid#2331\"]","[\"userid#5689\",\"movieid#3072\"]","[,","[default:","]","alway","apach","appli","array","bia","clause.","consid","const","control","default","describ","differ","effort","element","examples.","extend","featur","feature_hash","feature_hashing('aaa');","feature_hashing('aaa','","feature_hashing(array","feature_hashing(array(\"userid#4505:3.3\",\"movieid#2331:4.999\",","feature_hashing(array('1','2','3'));","feature_hashing(array('1:0.1','2:0.2','3:0.3'));","feature_hashing(array('aaa','bbb'));","feature_hashing(array('aaa
 
','bbb'),'","feature_hashing(array('aaa:1.0','aaa','bbb:2.0'));","feature_hashing(array(1,2,3));","feature_hashing(features),","feature_hashing(null,'","features)","features,","features.","find","follow","foundat","function","functions.","hash","help","help');","help]","hivemal","hivevar:num_features=16777216;","hivevar:num_features=1;","incub","incubator.","int","limit","mhash","mhash('aaa');","mhash('aaa',${num_features});","mhash('aaa:2.0');","mhash(array('aaa','bbb'));","mhash(array('bbb','aaa'));","mhash(str","mhash;","murmurhash3","never","note:","noteth","num_featur","number","number).","option.","options])","order","reserv","return","scalar","select","sentitive.","set","show","softwar","sponsor","start","string","support","system","through","training_fm","trick)","undergo","usage:","valu","value.","values.","vector","word)"],"ft_engineering/selection.html":["#features)","${k})","(","(#classes,","(1,","(\\sigma_{1}","(asf),","(chi2)","(n_class,","(n_classes,","(snr)","(x.#col
 
s,",")","),",");","+","/","1)","2)","3)","=","[udaf]","[udf]","\\mu_{2}|","\\sigma_{2})∣μ​1​​−μ​2​​∣/(σ​1​​+σ​2​​),","aggreg","algorithm","apach","appli","array","array)","array,","array>","array>,","array_avg(y)","array_sum(x)","articl","base","best","between","binar","binari","both","chi","chi2","chi2(observed::array>,","chi2(r.observed,","class","class_prob","classif","classification.","clearly,","col","construction.","creat","criterion","cross","defin","details.","deviat","dot","dot(class_prob.t,","dot(x.t,","each","effort","element","even","events.","expect","expected::array>)::struct,","featur","feature_count)","feature_count,","features,","foundat","function","hivemal","hivevar:k=2;","hot","import","importance_list","importance_list::array,","improv","incub","incubator.","independ","input","int","join","k","k::int)::array","kkk,","kkk.","know","l","l.expected)","label","larger","later.","list","mathemat","matrix","mean","metric,","model","n_c
 
lass","n_featur","n_features)","nois","note:","number","observ","observed,","omit","on","output","p","predict","prediction.","problems.","process","product","r","r.v.chi2,","r;","rank","ratio","rc.1","redund","refer","relev","result","row","score","select","select_k_best(l.x,","select_k_best(x,","select_k_best(x::array,","selection.","set","shape","shorten","signal","signatur","snr","snr(x,","snr(x::array,","snr,","snr;","softwar","sponsor","squar","standard","stat","statist","statistics,","struct,","subset","support","tabl","target","techniqu","test","time,","top","train","transpose_and_dot(class_prob,","transpose_and_dot(x::array,","transpose_and_dot(y,","two","undergo","univari","us","usag","v","v0.5","valu","variabl","vector","vector,","x","x)","y","y)","y.#cols)","y::array)::array","y::array)::array>","μk\\mu_{k}μ​k​​","σk\\sigma_{k}σ​k​​","χ2\\chi^2χ​2​​","∣μ1−μ2∣/(σ1+σ2)|\\mu_{1}"],"ft_engineering/binning.html":["'female'),","'female');","'ge
 
nder'),","'male'),","(","('emma',","('ethan',","('isabella',","('jacob',","('mason',","('noah',","('sophia',","(asf),","(bin","(user",")","),",");","0","1","15","15,","2","20","20,","22","22,","3)","3))","35","35,","46","46,","55","55,","=","[\"name#emma\",\"gender#female\",\"age:0\"]","[\"name#ethan\",\"gender#male\",\"age:2\"]","[\"name#isabella\",\"gender#female\",\"age:1\"]","[\"name#jacob\",\"gender#male\",\"age:1\"]","[\"name#mason\",\"gender#male\",\"age:1\"]","[\"name#noah\",\"gender#male\",\"age:2\"]","[\"name#sophia\",\"gender#female\",\"age:2\"]","[auto_shrink:","[udaf]","[udf]","a.","ag","age,","age:int","apach","appli","array","array('age'),","array('name',","array_concat(","auto_shrink","auto_shrink])","b","b.","behavior","bin","bin:","bins.","bins;","boolean","build_bins(age,","build_bins(weight,","categor","categorical_features(","col","creat","cross","data","data.","defin","divid","duplic","effort","entry::","exception.","f=>except","false]","featur","feature_binnin
 
g(age,","feature_binning(features,","features:","few","first","follows:","foundat","function","gender","group","hivemal","id)","incub","incubator.","input","insert","int","int,","int|bigint|float|doubl","join","key:","later.","mani","map","map('age',","map>","method","name","name,","not,","note:","notether","num_of_bin","num_of_bins:","num_of_bins[,","number","output","possibl","pre","prepar","quantil","quantiles)","quantiles.","quantiles:","quantiles_map","quantiles_map)","quantiles_map)/(weight,","quantiles_map:","quantit","quantitative_features(","rc.1","repeat","repeated:","result","sampl","select","separ","serial","signatur","skip","softwar","sponsor","string","string,","support","t","t=>skip,","tabl","table)","throw","trasform","true,","undergo","usag","user","v0.5","val:","valu","values.","variabl","variation:","vector","weight","weight:"],"ft_engineering/pairing.html":["(asf),","apach","effort","featur","foundat","hivemal","incub","incubator.","pare","softwar","sponsor","und
 
ergo"],"ft_engineering/polynomial.html":["\"c:0.3\"),","(asf),",")","+","2);","3);","3,",">","[\"a:0.5\",\"a^2:0.25\",\"a^3:0.125\",\"b:0.2\",\"b^2:0.040000003\",\"b^3:0.008\"]","[\"a:0.5\",\"a^a:0.25\",\"a^a^a:0.125\",\"a^a^b:0.05\",\"a^b:0.1\",\"a^b^b:0.020000001\",\"b:0.2\",\"b^b:0.040000003\",\"b^b^b:0.008\"]","[\"a:0.5\",\"a^a:0.25\",\"a^a^a:0.125\",\"a^a^b:0.25\",\"a^a^c:0.075\",\"a^b:0.5\",\"a^b^b:0.5\",\"a^b^c:0.15\",\"a^c:0.15\",\"a^c^c:0.045\",\"b:1.0\",\"b^b:1.0\",\"b^b^b:1.0\",\"b^b^c:0.3\",\"b^c:0.3\",\"b^c^c:0.09\",\"c:0.3\",\"c^c:0.09\",\"c^c^c:0.027000003\"]","[\"a:0.5\",\"a^a:0.25\",\"a^a^a:0.125\",\"a^a^c:0.075\",\"a^c:0.15\",\"a^c^c:0.045\",\"b:1.0\",\"c:0.3\",\"c^c:0.09\",\"c^c^c:0.027000003\"]","[\"a:0.5\",\"a^a:0.25\",\"a^b:0.1\",\"b:0.2\",\"b^b:0.040000003\"]","[\"a:0.5\",\"a^b:0.1\",\"a^b^c:0.030000001\",\"a^c:0.15\",\"b:0.2\",\"b^c:0.060000002\",\"c:0.3\"]","[\"a:0.5\",\"a^b:0.1\",\"b:0.2\"]","[\"a:0.5\",\"a^b:0.5\",\"a^b^c:0.15\",\"a^c:0.15\",\"b:1.0\",\"b^
 
c:0.3\",\"c:0.3\"]","[\"a:0.5\",\"a^c:0.15\",\"b:1.0\",\"c:0.3\"]","[,","allow","apach","assum","becom","boolean","cautionpolynomi","combinations.","degre","easili","effort","elimin","false);","false,","featur","features,","features.","foundat","function","gener","hivemal","incub","incubator.","inf","inf/","input","int","interact","interactiononly=false,","large.","learn,","linear","model.","n","non","normal","note:","on","polynomi","polynomial_feature(array","polynomial_features(array(\"a:0.5\",\"b:0.2\"),","polynomial_features(array(\"a:0.5\",\"b:0.2\",\"c:0.3\"),","polynomial_features(array(\"a:0.5\",\"b:1.0\",","polynomial_features(array(\"a:0.5\",\"b:1.0\",\"c:0.3\"),","power","powered_features(array","powered_features(array(\"a:0.5\",\"b:0.2\"),","regression/classif","scikit","select","similar","softwar","sponsor","true);","true,","truncat","truncate=true]","truncate=true])","undergo","unnecessari","us","x**n"],"ft_engineering/ft_trans.html":["(asf),","apach","effort","featur"
 
,"foundat","hivemal","incub","incubator.","softwar","sponsor","transform","undergo"],"ft_engineering/vectorization.html":["(a","(asf),",")","*","...)","1","1.0","1.0\",\"poutcome#unknown\"]","2","2;",">",">[\"a:0.2\",\"b:0.3\"]","[\"a:0.2\",\"b:0.3\",\"bool:1.0\"]","[\"a:0.2\",\"b:0.3\",\"weather#sunny\"]","[\"a:0.2\"]","[\"a:1.0\"]","[\"age:39.0\",\"job#blu","[\"age:51.0\",\"job#entrepreneur\",\"marital#married\",\"education#primary\",\"default#no\",\"balance:1443.0\",\"housing#no\",\"loan#no\",\"contact#cellular\",\"day:18.0\",\"month#feb\",\"duration:172.0\",\"campaign:10.0\",\"pdays:","age,job,marital,education,default,balance,housing,loan,contact,day,month,duration,campaign,pdays,previous,poutcom","apach","array","array(\"age\",\"job\",\"marital\",\"education\",\"default\",\"balance\",\"housing\",\"loan\",\"contact\",\"day\",\"month\",\"duration\",\"campaign\",\"pdays\",\"previous\",\"poutcome\"),","avoid","boolean","categor","collar\",\"marital#married\",\"education#secondary\
 
",\"default#no\",\"balance:1756.0\",\"housing#yes\",\"loan#no\",\"contact#cellular\",\"day:3.0\",\"month#apr\",\"duration:939.0\",\"campaign:1.0\",\"pdays:","column","dual;","each","effort","exampl","featur","featurenames,","features,","foundat","gener","hivemal","id,","incub","incubator.","limit","name)","row,","select","softwar","sponsor","tabl","table.","train","treat","true","undergo","us","valu","vector","vectorize_feature(array","vectorize_features(","vectorize_features(array(\"a\"),*)","vectorize_features(array(\"a\",\"b\"),\"0.2\",\"0.3\")","vectorize_features(array(\"a\",\"b\"),\"0.2\",0)","vectorize_features(array(\"a\",\"b\",\"bool\"),0.2,0.3,true)","vectorize_features(array(\"a\",\"b\",\"weather\"),\"0.2\",\"0.3\",\"sunny\")","w/","weight","y","zero"],"ft_engineering/quantify.html":["${output_row},","(","(asf),","(id,",")","*","*)","0","1","1,0,pdays),","10","102","1028","1029","10;","121","1294","13","14","140","1443","1466","150","16","172","1756","176","18","181","181
 
5","185","2","20","230","235","24","25","26","260","266","27","29","295","3","30","31","32","324","34","354","36","37","38","39","4","404","41","423","426","43","436","442","474","476","476,0,0,1,27,5,92,4,0,0,0]","486","5","502","51","52","54","567","572","572,0,1,1,5,3,26,24,0,0,0]","574","595","6","62","6217","63","7","707","8","895","9","908","92","939","[1.0,39.0,0.0,0.0,0.0,0.0,1756.0,0.0,0.0,0.0,3.0,0.0,939.0,1.0,0.0,0.0,0.0,1.0]","[10.0,32.0,7.0,1.0,2.0,0.0,1815.0,1.0,0.0,2.0,10.0,6.0,235.0,1.0,6.0,2.0,1.0,1.0]","[2.0,51.0,1.0,0.0,1.0,0.0,1443.0,1.0,0.0,0.0,18.0,1.0,172.0,10.0,0.0,0.0,0.0,1.0]","[3.0,36.0,2.0,1.0,2.0,0.0,436.0,1.0,0.0,0.0,13.0,0.0,567.0,1.0,1.0,2.0,1.0,1.0]","[30,2,1,2,0,1028,1,0,0,4,1,1294,2,0,0,0]","[32,2,0,0,0,6217,0,1,0,18,9,486,2,181,2,1]","[34,5,1,0,0,","[37,1,0,1,0,62,1,0,0,31,8,404,2,0,0,0]","[38,5,1,2,0,","[39,7,1,2,0,426,1,0,1,18,3,1029,1,0,0,0]","[4.0,63.0,3.0,0.0,0.0,0.0,474.0,1.0,0.0,0.0,25.0,2.0,423.0,1.0,0.0,0.0,0.0,1.0]","[41,0,0,0,0,121,0,0,
 
0,13,5,16,6,176,5,3]","[43,4,0,1,0,574,0,0,0,8,5,140,1,0,0,0]","[5.0,31.0,2.0,1.0,2.0,0.0,354.0,1.0,0.0,0.0,30.0,0.0,502.0,1.0,2.0,2.0,2.0,1.0]","[52,8,0,1,0,1466,1,1,0,20,9,150,1,0,0,0]","[54,5,0,0,0,324,0,0,2,13,5,51,1,0,0,0]","[6.0,29.0,0.0,1.0,0.0,0.0,260.0,0.0,0.0,1.0,2.0,3.0,707.0,14.0,0.0,0.0,0.0,1.0]","[7.0,37.0,4.0,0.0,0.0,0.0,52.0,0.0,0.0,0.0,6.0,4.0,908.0,1.0,3.0,9.0,2.0,1.0]","[8.0,32.0,5.0,1.0,0.0,0.0,230.0,0.0,0.0,0.0,18.0,5.0,442.0,1.0,4.0,8.0,1.0,1.0]","[9.0,31.0,6.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,7.0,5.0,895.0,2.0,5.0,2.0,1.0,1.0]","admin.","ag","age,","apach","apr","array(age,","asc","aug","balanc","balance,","blue","campaign","campaign,","cast(pday","cellular","collar","column","contact","contact,","dataset","day","day,","default","default,","desc","durat","duration,","educ","education,","effort","employ","entrepreneur","failur","fals","featur","feb","forc","foundat","hivemal","hivevar:output_row=true;","hous","housemaid","housing,","id","id,","if(pdays==","incub","i
 
ncubator.","index","int","jan","job","job,","jul","jun","later.","limit","loan","loan,","manag","marit","marital,","marri","month","month,","non","note:","nov","number","numbers.","order","output_row,","pday","pdays,","poutcom","poutcome)","poutcome,","previou","previous,","primari","quantifi","quantified_featur","quantified_features(","quantify(","quantify(${output_row},","quantify()","reduc","retir","run","secondari","select","self","sep","servic","set","singl","softwar","sponsor","string","string),","success","support","t","t0","t1","t2","technician","telephon","tertiari","test","train","train;","train_first,","transform","true","undergo","union","unknown","us","v0.4","valu","y","y)","ye"],"ft_engineering/tfidf.html":["\":\",","\"realm:0.03282491756638329\",\"divided:0.03282491756638329\",\"concepts:0.03282491756638329\",\"attainment:0.032824","${n_docs})","&","'/home/myui/tmp/tfidf_test.tsv'","'|'","(","(asf),","(docid,","(docid,word)","(log(10,","(tf.word",")","*","+","...",".0
 
4200326112968063\",\"judgement:0.035169554338885474\",\"apply:0.035169554338885474\",\"disposition:0.035169554338","0.014001086678120098","0.017584777169442737","0.03282491756638329\",\"moral:0.03282491756638329\",\"numerous:0.03282491756638329\",\"philosophical:0.032824917566","0.06564983513276658","0.07033910867777095","0.09484606645205085","0.12","0.13","0.1641245850805637","1","1,","1.0)","1.0);","2","2,","3","38329\",\"application:0.03282491756638329\",\"perspectives:0.03282491756638329\",\"procedural:0.03282491756638329\",","56638329\",\"equity:0.03282491756638329\",\"includes:0.03282491756638329\",\"theology:0.03282491756638329\",\"ethics:","64983513276658\",\"based:0.06564983513276658\",\"religion:0.06564983513276658\",\"viewpoints:0.03282491756638329\",\"","82491756638329\",\"rightness:0.03282491756638329\",\"general:0.03282491756638329\",\"many:0.03282491756638329\",\"dif","885474\",\"given:0.035169554338885474\"","91756638329\",\"fields:0.03282491756638329\",\"often:0.026
 
135361945200226\",\"philosophy:0.026135361945200226\",\"stu","=","[\"action:0.07033910867777095\",\"wisdom:0.05275433288400458\",\"one:0.05275433288400458\",\"understanding:0","[\"justice:0.1641245850805637\",\"found:0.06564983513276658\",\"discussion:0.06564983513276658\",\"law:0.065","abov","act","action","apach","appropri","befor","beta3","calcul","cast(${n_docs}","cast(n_doc","cd","collect_all(concat(word,","collect_list(concat(word,","collect_list(feature(word,","compos","comput","consid","consist","count(distinct","creat","data","defin","delimit","desc;","df","df.docs,","df.word)","df_t","discuss","doc","docid","docid)","docid,","docid/word","docid;","document","document_frequ","download","dy:0.026135361945200226\"]","each","effort","entri","experi","explain","explode(tokenize(page,true))","explode(word2freq)","extern","featur","fering:0.03282491756638329\",\"fairness:0.03282491756638329\",\"social:0.03282491756638329\",\"broadest:0.032824917","field","find","float)/max2(1,df.
 
docs))","float)/max2(1,df_t))","float,","follows:","format","found","foundat","freq","freq;","group","hive","hive/hivemall.","hivemal","hivevar:n_docs=3;","https://gist.githubusercontent.com/myui/190b91a3a792ccfceda0/raw/327acd192da4f96da8276dcdff01b19947a4373c/tfidf_test.tsv","idf","idf(df_t","idf,","if(x>y,x,y);","incub","incubator.","inpath","int)","int,","is_stopword(word);","join","justic","justice,","knowledg","knowledge,","later","later.","law","link.","load","local","macro","max2(x","n_doc","need","notethi","number","order","page","pair","pair,","prepar","query.","rationality:0.03282491756638329\",\"including:0.03282491756638329\",\"context:0.03282491756638329\",\"concept:0.032","relat","religion","replac","respectively.","result","row","select","set","softwar","sponsor","store","string","support","t","t2","tabl","table/view","temporari","term_frequ","termin","textfile;","tf","tf(word)","tf.docid,","tf.freq","tf.word,","tf/df","tfidf","tfidf(tf","tfidf(tf.freq,","tfidf))","t
 
otal","tuples.","undergo","us","v0.3","v0.3.4","valu","vector","view","views,","virtu","well","wget","wikipag","wikipage;","wikipage_explod","wikipedia","willing","wisdom,","word","word)","word,","word2freq","word;","y","~/tmp"],"eval/binary_classification_measures.html":["\"matched\"","'","(1+\\beta^2)","(:","(asf),","(fn):","(fp):","(int","(tn):","(tp):","*","+","0","0.4","0.45454545454545453","0.5","0/1","1","1.0,","2","2.","4",";","=","\\frac{1}{2}precision=​2​​1​​.","\\frac{1}{3}precision=​3​​1​​.","\\frac{\\mathrm{\\#tp}","\\frac{\\mathrm{\\#tp}}{\\mathrm{\\#tp}","\\frac{\\mathrm{precision}","\\mathrm{\\#fn}","\\mathrm{\\#fn}}","\\mathrm{\\#fp}","\\mathrm{\\#fp}}","\\mathrm{\\#tn}}","\\mathrm{\\#tn}}{\\mathrm{\\#tp}","\\mathrm{f}_1","\\mathrm{f}_{\\beta}","\\mathrm{precision}","\\mathrm{recall}","\\mathrm{recall}}","\\mathrm{recall}}{\\beta^2","\\mathrm{recall}}{\\mathrm{precision}","abov","advertis","apach","appropriate.","area","argument","argument.","arr
 
ay(predicted))","article.","averag","average,","average.","base","beta","between","binari","binary')","boolean).","calcul","case","case,","categories.","cautionhivemal","center","classif","classifi","classification'","classification,","click","column","comput","consid","correct","count","creat","curv","data","data;","deal","default","descript","detail","determin","each","effort","element","equation:","equival","evalu","exampl","example,","examples,","explanation.","extern","f","f1","f1=2precision∗recallprecision+recal","f1score","f1score(array(truth),","f1score(truth,","fals","fmeasur","fmeasure(truth,","fn","fn:","focus","follow","follows:","foundat","fp","fp:","function","function,","fβ=(1+β2)precision∗recallβ2precision+recal","f​1​​=2​precision+recall​​precision∗recall​​","f​β​​=(1+β​2​​)​β​2​​precision+recall​​precision∗recall​​","gener","given","hand,","harmon","hivemal","hivemall'","ignor","illustr","includ","incorrect"
 
,"incub","incubator.","indic","information.","int,","introduc","know","label","label,","label.","labels,","labels.","larger","learn","learn'","leftmost","mean","measur","metric","metrics,","micro","micro')","micro'.","micro(default)","modifi","more","neg","negative.","new","note","number","obtain","old","omitted,","ones.","onlin","operation.","option","output","page","paramet","pass","pleas","posit","precis","precision.","precision=#tp#tp+#fp","precision=#tp+#tn#tp+#fp+#tn","precision=12\\mathrm{precision}","precision=13\\mathrm{precision}","precision=​#tp+#fp+#tn​​#tp+#tn​​","precision=​#tp+#fp​​#tp​​","predict","predicted)","predicted,","prediction.","preliminari","previou","probabl","problem","problems.","provid","queri","rate","reach","recal","recall.","recall=#tp#tp+#fn","recall=#tp+#tn#tp+#fn+#tn","recall=​#tp+#fn+#tn​​#tp+#tn​​","recall=​#tp+#fn​​#tp​​","recommend","repres","resource:","roc","row","same","sampl","scikit","score","score)
 
.","score.","select","set","sever","show","simpli","smaller","so,","softwar","special","sponsor","such","switch","tabl","table.","task","that,","those","tn","tn:","to:","toy","tp:","tr","true","truth","truth,","tutori","two","type","under","undergo","union","us","valu","value'","value:","values:","want","weight","wikipedia","β=1\\beta=1β=1","β=1\\beta=1β=1.","β=2\\beta=2β=2","β\\betaβ"],"eval/auc.html":["(","(asf),","(auc)","(i.e.,","(label=0)","(label=1)","(rows)",")","/","0","0.2","0.2)","0.3","0.5","0.54001","0.7","0.8","0.83333","1","1]","5","[0,","abov","above,","above:","allow","anoth","apach","approxim","area","assum","auc","auc(doubl","auc(prob,","auc.","base","better.","between","bin","binari","both","call","case.","classif","classifi","classification.","claus","column","compar","comput","contain","curv","data","desc","descend","differ","distribut","effort","evalu","example,","floor(prob","follow","follows:","foundat","function","gener","give","hand,","henc","higher
 
","hive'","hivemal","hivemall,","incub","incubator.","input","instance,","int","label","label)","label.","labels.","large,","larger","logarithm","logist","logloss(prob,","loss","mani","mean","meanwhile,","mention","metric","need","neg","negative)","node","note","now","on","onc","one.","order","order,","order.","pair","pairs.","parallel","parallel:","perform","posit","positive/neg","predict","prob","prob,","probabilities)","probability(predict","probability.","probabl","problem","produc","provid","queri","range.","rank","regression.","rel","respect","return","roc","row","rows,","sampl","samples.","score","score)","score,","select","sequenti","shown","simpli","singl","smaller","softwar","sort","sponsor","such","t;","tabl","truth","ultimately,","under","undergo","union","us","way","well.","wide"],"eval/multilabel_classification_measures.html":["\"bird\")","\"cat\")","\"dog\")","\"dog\",","'","(","(1+\\beta^2)","(:","(\\sum_i","(asf),","(no",")","+","0.6779661016949152","0.6956521739130
 
435","0≤li≤∣l∣0","1.0,","2","2*","2.')",";","=","\\beta^2","\\cap","\\frac","\\leq","\\mathrm{f}_1","\\mathrm{f}_{\\beta}","\\sum_i","actual,","anim","apach","array(\"bird\")","array(\"bird\",","array(\"cat\")","array(\"cat\",","array(\"dog\")","array(\"dog\",","array()","article.","base","beta","bird","bird,","blog","calcul","case","cat","cat,","categories.","cautionhivemal","classif","classification'","classifier.","column","comput","data","dataset","dataset,","defin","determin","document.","dog","dog,","each","effort","equation:","equival","evalu","exampl","explanation.","f","f1","f1=2∑i∣li∩pi∣2∗∑i∣li∩pi∣+∑i∣li−pi∣+∑i∣pi−li∣","f1score","fmeasur","fmeasure(actual,","focus","follow","foundat","function","function,","fβ=(1+β2)∑i∣li∩pi∣β2(∑i∣li∩pi∣+∑i∣li−pi∣)+∑i∣li∩pi∣+∑i∣pi−li∣","f​1​​=2​2∗∑​i​​∣l​i​​∩p​i​​∣+∑​i​​∣l​i​​−p​i​​∣+∑​i​â
 
€‹âˆ£p​i​​−l​i​​∣​​∑​i​​∣l​i​​∩p​i​​∣​​","f​β​​=(1+β​2​​)​β​2​​(∑​i​​∣l​i​​∩p​i​​∣+∑​i​​∣l​i​​−p​i​​∣)+∑​i​​∣l​i​​∩p​i​​∣+∑​i​​∣p​i​​−l​i​​∣​​∑​i​​∣l​i​​∩p​i​​∣​​","gener","given","ground","hand,","harmon","hivemal","iii","incub","incubator.","introduc","l_i","l_i|","l_i|}","label","label)","labels,","larger","left","lil_il​i​​","lll","manner,","mean","measur","measure.","metric","micro","more","multi","name","obtain","old","omitted,","operation.","p_i","p_i|","p_i|)","page","paramet","pip_ip​i​​","posit","post","posts,","posts.","precision.","predict","predicted)","predicted,","prediction.","problem","problems.","provid","queri","reach","recal","recall.","recommend","repres","right","same","sampl","score","score).","score.","select","set","show","smaller","so,","
 
softwar","special","sponsor","such","suppos","tabl","tag","task","th","toy","truth","two","undergo","union","uniqu","us","valu","weight","{","{\\sum_i","|","|l_i","|l|0≤l​i​​≤∣l∣.","|p_i","|}","}","β=1\\beta=1β=1","β=1\\beta=1β=1.","β=2\\beta=2β=2.","β\\betaβ"],"eval/regression.html":["${mean_actual},2.0))","(","(asf),","(r^2)",")","/","0","0.01","0.02","0.14852283792484033","0.2466732002711477","0.38538660838804495","0.48623913673053565","1","1.9610366706408238","3.8200363760415414","3.8200363760415414;","3.9124877451612488","absolut","actual)","actual))/count(1)","actual)*ln(1","actual,","actual,2.0))/count(1)","actual,2.0))/count(1))","alpha.5","apach","avg(actual),","avg(predicted)","coeffici","comput","determin","e2006","e2006tfidf_pa2a_submit;","effort","error","evalu","example,","explain","follows:","foundat","hive.","hivemal","hivevar:mean_actual=","http://en.wikipedia.org/wiki/coefficient_of_determin","https://www.kaggle.com/wiki/metr","incub","incubat
 
or.","logarithm","logloss(predicted,","logloss1,","logloss2","loss","mae(predicted,","mae,","mean","metric","model","mse(predicted,","mse,","predict","predicted)","predicted))/count(1)","predicted,2.0))","r2","r2(actual,","rc.1","refer","regress","rmse(predicted,","rmse,","root","score","select","set","softwar","sponsor","sqrt(sum(pow(predict","squar","sum(abs(predict","sum(actual*ln(predicted)+(1","sum(pow(actu","sum(pow(predict","support","t","t;","tfidf","undergo","union","us","v0.4.1","v0.4.2"],"eval/rank.html":["\"","&","'","(","(1","(2^{\\mathrm{rel}_n}","(\\mathrm{otherwise})","(asf),","(auc)","(i+,i−)(i^+,","(i.e.,","(i_n","(itemid","(map)","(max_k)","(mrr)","(n","(ndcg)","(precision@k)","(recall@k)","(scores)","(t1.userid","(the","(userid",")",")(i​+​​,i​−​​)","),","+",",",".","...,","/","0","0.3333333333333333","0.333recall@2=1/3≈0.333.","0.5","0.5555555555555555","0.5precision@2=1/2=0.5","0.6131471927654585","0.613ndcg​2​​=dcg​2​​/idcg​2​
 
​≈0.613.","0.6666666666666666","0.7039180890341349","0.75","0.8128912838590544","0.9187707805346093","1","1)","1,","1.0","1.631idcg​2​​=1/log​2​​2+1/log​2​​3≈1.631.","1/1","1/\\log_2","10.0","1dcg​2​​=1/log​2​​2=1.","1mrr=1/1=1,","1}^{|\\mathcal{i}|}","2","2)","2),","2,","2.0","3","3)","3,","3.0","3\\}i​2​​(u)={1,3}","3\\}u={1,2,3},","4","4)","4,","4.0","4\\}i​u​+​​={1,2,4},","4\\}i​u​+​​={1,2,4}.","5,","5.0","5\\})","6","6,","6.0","6\\}i={1,2,3,4,5,6}","8.0",";","=","=>",">","[","[1,2,4]","[1,3,2,6],","\\\\","\\approx","\\begin{array}{ll}","\\cap","\\cdot","\\end{array}","\\frac{1}{n_{\\mathrm{tp}}}.","\\frac{1}{|\\mathcal{i}^+_u|}","\\frac{2}{3}","\\frac{3}{4}}{3}","\\frac{3}{5}}{3}","\\frac{\\frac{1}{1}","\\frac{\\mathrm{dcg}_k}{\\mathrm{idcg}_k}","\\frac{\\sum_{n=1}^{|\\mathcal{i}|}","\\frac{|\\mathcal{i}^+_u","\\in","\\left[","\\left[i_n","\\left\\{","\\leq","\\log_2(n","\\mathbf{0.756},","\\mathbf{0.806}.","\\mathcal{i}
 
^","\\mathcal{i}^+_u","\\mathcal{i}^+_u)","\\mathcal{i}^+_u\\right]}{\\sum_{n=1}^{|\\mathcal{i}|}","\\mathcal{i}^+_ui​+​​∈i​u​+​​","\\mathcal{i}i​k​​(u)⊂i,","\\mathcal{u}u∈u,","\\mathrm{dcg}_2","\\mathrm{idcg}_2","\\mathrm{map}","\\mathrm{map}(\\mathcal{i}^+_u,","\\mathrm{mrr}","\\mathrm{ndcg}_k","\\mathrm{precision@}k","\\mathrm{precision@}n","\\mathrm{recall@}k","\\mathrm{rel}_n","\\right.","\\right]n​tp​​∈[1,∣i∣],","\\subset","\\sum_{n","\\time","\\{1,","].","_ui​−​​∈i​u​−​​,","_u|∣i​u​+​​∣×∣i​u​−​​∣","abov","above,","above.","accord","accuraci","addit","addition","additionally,","aggreg","allow","altern","and/or","apach","applic","approach","arbitrari","area","argument:","as:","assess","assign","assum","auc","auc(t1.rec,","auc,","auc_at_2,","avail","averag","average_precision(t1.rec,","average_precision,","average_precision_at_2,","base","basically,","be","be:","before.","behind","best","better"
 
,"between","binari","built","by:","case","cast(count(itemid)","cautionbefor","cautionin","chapter,","choic","chosen","classif","collabor","collect_set(itemid)","combin","compar","complet","comput","concept","consid","consist","contain","context","convincing,","correct","correspond","count(itemid)","cover","coverag","creat","cumul","curv","d_k(n)","d_k(n)},","dcg2=1/log22=1\\mathrm{dcg}_2","dcgk\\mathrm{dcg}_kdcg​k​​","demonstr","denot","depict","describ","determin","differ","directli","discount","dk(n)={(2reln−1)/log2(n+1)(1≤n≤k)0(n>k).","done","dummi","dummy_rec","dummy_rec?","dummy_recrel","dummy_truth","duplic","d​k​​(n)={​(2​rel​n​​​​−1)/log​2​​(n+1)​0​​​(1≤n≤k)​(n>k)​​.","each","easi","effici","effort","emphasi","empty.","enabl","equation:","evalu","even","exactli","example,","exist","expect","figur","filter","final","first","fit","fix","focus","follow","follows:","formul","formulation,","foundat","function","gain","gene
 
r","give","grade","group","handl","hence,","here","here,","higher","highest","hive","hivemal","hivemall'","hivemall.","however,","i(u)i(u)i(u)","i(u)i(u)i(u)),","i(u)i(u)i(u),","i+i^+i​+​​","i+∈iu+i^+","i2(u)={1,3}i_2(u)","i2(u)i_2(u)i​2​​(u)","i={1,2,3,4,5,6}\\mathcal{i}","i\\mathcal{i}i,","i^","i_k(u)|}{|\\mathcal{i}^+_u|}.","i_k(u)|}{|i_k(u)|}.","i_k(u)|∣i​u​+​​∩i​k​​(u)∣","i_n","idcg2=1/log22+1/log23≈1.631\\mathrm{idcg}_2","idcgk\\mathrm{idcg}_kidcg​k​​","ik(u)i_k(u)i​k​​(u)","ik(u)i_k(u)i​k​​(u),","ik(u)⊂ii_k(u)","implement","importantly,","incorpor","incub","incubator.","indic","inform","ini_ni​n​​","input","instead","int)","interest","intern","interpret","introduc","inverse:","is,","issu","item","itemid","itemid),","itemid,","items,","items.","items:","iu+={1,2,4}\\mathcal{i}^+_u","iu+\\mathcal{i}^+_ui​u​+​​","iu+\\mathcal{i}^+_ui​u​+​​.","iu+\\mathcal{i}^+_ui​u​+​​;","i​−​​.","i−i
 
^","i−∈iu−i^","join","k","k)","key","key)","key,","key.hence,","keyword","kind","label","later.","latest","launch","lead","learn","length","list","list,","lists.","machin","map","map(iu+,{1,3,2,4,6,5})=11+23+343≈0.806.","map(iu+,{1,3,2,6,4,5})=11+23+353≈0.756,","map(i​u​+​​,{1,3,2,4,6,5})=​3​​​1​​1​​+​3​​2​​+​4​​3​​​​≈0.806.","map(i​u​+​​,{1,3,2,6,4,5})=​3​​​1​​1​​+​3​​2​​+​5​​3​​​​≈0.756,","map.","map=1∣iu+∣∑n=1∣i∣precision@nâ‹
…
[in∈iu+].","map=​∣i​u​+​​∣​​1​​​n=1​∑​∣i∣​​precision@nâ‹
…
[i​n​​∈i​u​+​​].","map_values(to_ordered_map(key,","map_values(to_ordered_map(score,","match","max_k","mean","meanwhile,","measur","measure,","measures,","metric","metric.","more","mpr","mrr","mrr(t1.rec,","mrr,","mrr=1/1=1\\mathrm{mrr}","mrr=1ntp.","mrr=​n​tp​​​​1​​.","mrr_at_2,","much","multipl","n","name","name
 
s.","ndcg","ndcg()","ndcg(t1.rec,","ndcg,","ndcg2=dcg2/idcg2≈0.613\\mathrm{ndcg}_2","ndcg_at_2","ndcgk=dcgkidcgk=∑n=1∣i∣dk(n)[in∈iu+]∑n=1∣i∣dk(n),","ndcg​k​​=​idcg​k​​​​dcg​k​​​​=​∑​n=1​∣i∣​​d​k​​(n)​​∑​n=1​∣i∣​​d​k​​(n)[i​n​​∈i​u​+​​]​​,","newer","nnn","non","normal","notation.","notic","now,","ntp∈[1,∣i∣]n_{\\mathrm{tp}}","number","observations.","obtain","on","order","origin","out","output","over","page","pair","pairs.","pairs:","permutation,","place","portion","posit","positive,","positives.","possibl","potenti","practic","precis","precise,","precision(),","precision().","precision,","precision@1,","precision@2,","precision@2=1/2=0.5\\mathrm{precision@}2","precision@k","precision@k=​∣i​k​​(u)∣​​∣i​u​+​​∩i​k​​(u)∣​​.","precision@k=∣iu+∩ik(u)∣∣ik(u)∣.","precision@∣i∣|\\mathcal{i}|∣i∣,","precision_at()","precis
 
ion_at(t1.rec,","precision_at_2,","prediction:","problem","problem,","problem.","problems.","process","provid","quantit","queri","query:","rank","rc.1","rc.1,","reason","rec","rec,","recal","recall()","recall,","recall@2=1/3≈0.333\\mathrm{recall@}2","recall@k","recall@k,","recall@k=​∣i​u​+​​∣​​∣i​u​+​​∩i​k​​(u)∣​​.","recall@k=∣iu+∩ik(u)∣∣iu+∣.","recall_at()","recall_at(t1.rec,","recall_at_2,","reciproc","recommend","recommendation,","recommendation.","regist","relev","reln={1(in∈iu+)0(otherwise).","reln\\mathrm{rel}_nrel​n​​","reln\\mathrm{rel}_nrel​n​​,","relscore(expected)","rel​n​​={​1​0​​​(i​n​​∈i​u​+​​)​(otherwise)​​.","renam","replac","reserv","respect","respons","responses,","responses.","result","retriev","return","reverse\")","reverse')","roc","s","same","sampl","samples.","score","score(predicted)","score,","second","select","separ","set","setting,","show","simpl","sim
 
pli","singl","six","size","softwar","solv","specifi","sponsor","still","strongli","such","suggest","sum","system,","t1","t1.max_k)","t2","t2.truth,","t2.userid)","tabl","table,","tables,","tackl","take","target","th","that,","three","thus,","to_ordered_list(itemid,","to_ordered_list(relscore,","to_ordered_list(struct(relscore,","to_ordered_list(value,","to_ordered_map()","top","true","true))","true)).","truth","two","u={1,2,3}\\mathcal{u}","under","undergo","unlik","us","usag","user","userid","userid,","u∈uu","v0.5","v2.2.0,","valu","value,","values)","values,","version","way","well","within","words,","zero","|\\mathcal{i}^","|\\mathcal{i}|","∣iu+∣×∣iu−∣|\\mathcal{i}^+_u|","∣iu+∩ik(u)∣|\\mathcal{i}^+_u","∣i∣|\\mathcal{i}|∣i∣."],"eval/datagen.html":["(asf),","apach","data","effort","foundat","gener","hivemal","incub","incubator.","softwar","sponsor","undergo"],"eval/lr_datagen.html":["\"","(","(asf),","(at","(label,features)","(recommended)",")",");","*","0
 
.0","0.044","0.046","0.13126314\",\"190:0.18610542\",\"131:1.7232913\",\"24:","0.19020283\",\"21:","0.54811275\"]","0.5568947\",\"10:0.621897\",\"6:","0.7220096","0.7274741","0.7346627","0.9842969\",\"177:0.062993184\",\"176:","0/1","1","1.0","10","100","100\")","100')","1000","10k","1;","2","2.7551131\",\"113:","2;","5;","9999","[\"139:1.9607254\",\"110:2.958568\",\"186:3.2524762\",\"31:3.9243593\",\"167:0.72854257\",\"26:1.8355447\",\"117:2.7663715\",\"3:2.1551287\",\"179:3.1099443\",\"19:3.6411424\"]","[\"140:2.8347101\",\"165:3.0056276\",\"179:4.030076\",\"112:3.3919246\",\"99:3.98914\",\"16:3.5653272\",\"128:3.046535\",\"124:2.7708225\",\"78:2.4960368\",\"6:1.7866131\"]","[\"34:2.9269936\",\"35:0.37033868\",\"39:3.771989\",\"47:2.2087111\",\"28:2.9445739\",\"55:4.134555\",\"14:2.4297745\",\"164:3.0913055\",\"52:2.0519433\",\"128:2.9108515\"]","[\"73:3.4391513\",\"198:4.42387\",\"164:4.248151\",\"66:3.5224934\",\"84:1.9026604\",\"76:0.79803777\",\"18:2.2168183\",\"163:2.248695\"
 
,\"119:1.5906067\",\"72:2.0267224\"]","[\"84:","[\"84:3.4227803\",\"80:3.8875976\",\"58:3.2909582\",\"123:3.1056073\",\"194:3.3360343\",\"199:2.20207\",\"75:3.5469763\",\"74:3.3869767\",\"126:0.9969454\",\"93:2.5352612\"]","[\"98:4.2451696\",\"4:3.486905\",\"133:2.4589922\",\"26:2.7301126\",\"103:2.6827147\",\"2:3.6198254\",\"34:3.7042716\",\"47:2.5515237\",\"68:2.4294896\",\"197:4.4958663\"]","[4.061373,3.9373128,3.5195694,3.3604698,3.7698417,4.2518,3.8796813,1.6020582,4.937072,1.5513933,3.0289552,2.6674519,3.432688,2.980945,1.8897587,2.9770515,3.3435504,1.7867403,3.4057906,1.2151588,5.0587463,2.1410913,2.8097973,2.4518871,3.175268,3.3347685,3.728993,3.1443396,3.5506077,3.6357877,4.248151,3.5224934,3.2423255,2.5188355,1.8626233,2.8432152,2.2762651,4.57472,2.2168183,2.248695,3.3636255,2.8359523,2.0327945,1.5917025,2.9269936,0.37033868,2.6151125,4.545956,2.0863252,3.7857852,2.9445739,4.134555,3.0660007,3.4279037,2.0519433,2.9108515,3.5171766,3.4708095,3.161707,2.39229,2.4589922,2.730
 
1126,3.5303073,2.7398396,3.7042716,2.5515237,3.0943663,0.41565156,4.672767,3.1461313,3.0443575,3.4023938,2.2205734,1.8950733,2.1664586,4.8654623,2.787029,4.0460386,2.4455893,3.464298,1.062505,3.0513604,4.382525,2.771433,3.2828436,3.803544,2.178681,4.2466116,3.5440445,3.1546876,3.4248536,0.9067459,3.0134914,1.9528451,1.7175893,2.7029774,2.5759792,3.643847,3.0799,3.735559]","apach","array","cl\"","cl\")","classif","count(*)+1","count(1)","creat","data","dataset","dataset.","default","default,","dens","desc","detail","distribut","dual","dual;","dummi","effort","featur","fetched:","find","float","follows:","foundat","gener","generate_series(1,${n_parallel_datagen})","generated.","help').","hive>","hivemal","hivevar:n_parallel_datagen=10;","incub","incubator.","insert","int","label","label.","limit","logist","lr_datagen(\"","lr_datagen('","lrdata1k","lrdata1k;","mapred.reduce.tasks=","mapred.reduce.tasks=${n_parallel_datagen};","max)","multipl","n_dim","n_exampl","n_featur","none","ok","
 
option","option,","parallel","reduc","reducers.","regress","regression_data1","regression_data1;","regression_data_dens","regression_data_dense;","replac","reset","row(s)","run","scalabl","seconds,","seed","select","seq10","seq10;","set","singl","softwar","spars","sponsor","t","tabl","taken:","task","time","undergo","us","value;","view","well"],"supervised_learning/prediction.html":["\"model\"","\"predict","'","(0/1","(\\mathbf{x}_2,","(\\mathbf{x}_n,","(asf),","(i.e.,","(input)","(integer)","(output)","(sgd)","(synonym:","(x1,y1),(x2,y2),⋯,(xn,yn)(\\mathbf{x}_1,","(xi,yi)(\\mathbf{x}_i,","(λ\\lambdaλ","+","...","0","0,","0.005]","0.54,","1","1,","1/1),","10]","17.1","1]","2","2.","21.3","42.195,","6.2",":=","[\"1:0.001\",\"4:0.23\",\"35:0.0035\",...]","[\"1:0.2\",\"3:0.1\",\"13:0.005\",...]","[\"5:1.3\",\"22:0.0.089\",\"77:0.0001\",...]","[default:","\\cdots,","\\frac{1}{n}","\\lambda","\\mathbf{x}_i,","\\sum_{i=1}^{n}","abov","accuracy.","achiev","adadelta","adagrad","adam","a
 
dditionally,","algorithm","anoth","apach","applied.","appropri","articl","as:","assum","auxiliari","avail","base","batch","before,","behav","below","below:","better","binari","briefli","build","call","case","categor","choic","class","classif","classification,","classification.","classifier,","classifiers.","click","combin","condit","configur","construct","construct

<TRUNCATED>

Reply via email to