Feature Vectorization
array<string> vectorize_feature(array<string> featureNames, ...)
is useful to generate a feature vector for each row, from a table.
select vectorize_features(array("a","b"),"0.2","0.3") from dual;
>["a:0.2","b:0.3"]
-- avoid zero weight
select vectorize_features(array("a","b"),"0.2",0) from dual;
> ["a:0.2"]
-- true boolean value is treated as 1.0 (a categorical value w/ its column name)
select vectorize_features(array("a","b","bool"),0.2,0.3,true) from dual;
> ["a:0.2","b:0.3","bool:1.0"]
-- an example to generate feature vectors from table
select * from dual;
> 1
select vectorize_features(array("a"),*) from dual;
> ["a:1.0"]
-- has categorical feature
select vectorize_features(array("a","b","weather"),"0.2","0.3","sunny") from dual;
> ["a:0.2","b:0.3","weather#sunny"]
select
id,
vectorize_features(
array("age","job","marital","education","default","balance","housing","loan","contact","day","month","duration","campaign","pdays","previous","poutcome"),
age,job,marital,education,default,balance,housing,loan,contact,day,month,duration,campaign,pdays,previous,poutcome
) as features,
y
from
train
limit 2;
1 ["age:39.0","job#blue-collar","marital#married","education#secondary","default#no","balance:1756.0","housing#yes","loan#no","contact#cellular","day:3.0","month#apr","duration:939.0","campaign:1.0","pdays:-1.0","poutcome#unknown"] 1 2 ["age:51.0","job#entrepreneur","marital#married","education#primary","default#no","balance:1443.0","housing#no","loan#no","contact#cellular","day:18.0","month#feb","duration:172.0","campaign:10.0","pdays:-1.0","poutcome#unknown"] 1