blob: 7434f4483e890ce3000311a60779e5e768dcbf31 [file] [log] [blame]
\qecho =================================================================
\qecho === Running: mulit-linear regression ============================
\qecho =================================================================
\qecho
\qecho === Refresh table: houses =======================================
DROP TABLE IF EXISTS houses;
CREATE TABLE houses (id INT, tax INT, bedroom INT, bath FLOAT, price INT, size INT, lot INT) distributed by (ID);
COPY houses FROM STDIN DELIMITER '|';
1 | 590 | 2 | 1 | 50000 | 770 | 22100
2 | 1050 | 3 | 2 | 85000 | 1410 | 12000
3 | 20 | 3 | 1 | 22500 | 1060 | 3500
4 | 870 | 2 | 2 | 90000 | 1300 | 17500
5 | 1320 | 3 | 2 | 133000 | 1500 | 30000
6 | 1350 | 2 | 1 | 90500 | 820 | 25700
7 | 2790 | 3 | 2.5 | 260000 | 2130 | 25000
8 | 680 | 2 | 1 | 142500 | 1170 | 22000
9 | 1840 | 3 | 2 | 160000 | 1500 | 19000
10 | 3680 | 4 | 2 | 240000 | 2790 | 20000
11 | 1660 | 3 | 1 | 87000 | 1030 | 17500
12 | 1620 | 3 | 2 | 118600 | 1250 | 20000
13 | 3100 | 3 | 2 | 140000 | 1760 | 38000
14 | 2070 | 2 | 3 | 148000 | 1550 | 14000
15 | 650 | 3 | 1.5 | 65000 | 1450 | 12000
\.
\qecho === Show data sample: ===========================================
select * from houses limit 5;
\qecho === Calculate Coefficients ======================================
select madlib.linregr_coef(price, array[1, bedroom, bath, size])::REAL[] from houses;
\qecho === Calculate R square value ====================================
select madlib.linregr_r2(price, array[1, bedroom, bath, size])::REAL from houses;
\qecho === Calculate t statistics ======================================
select madlib.linregr_tstats(price, array[1, bedroom, bath, size])::REAL[] from houses;
\qecho === Calculate p values ==========================================
select madlib.linregr_pvalues(price, array[1, bedroom, bath, size])::REAL[] from houses;