diff --git a/docs/site/files/dml-language-reference/data.csv b/docs/site/files/dml-language-reference/data.csv new file mode 100644 index 00000000000..0c18568df99 --- /dev/null +++ b/docs/site/files/dml-language-reference/data.csv @@ -0,0 +1 @@ +zipcode,district,sqft,numbedrooms,numbathrooms,floors,view,saleprice,askingprice 95141,south,3002,6,3,2,FALSE,929,934 NA,west,1373,,1,3,FALSE,695,698 91312,south,NA,6,2,2,FALSE,902, 94555,NA,1835,3,,3,,888,892 95141,west,2770,5,2.5,,TRUE,812,816 95141,east,2833,6,2.5,2,TRUE,927, 96334,NA,1339,6,3,1,FALSE,672,675 96334,south,2742,6,2.5,2,FALSE,872,876 96334,north,2195,5,2.5,2,FALSE,799,803 \ No newline at end of file diff --git a/docs/site/files/dml-language-reference/data.csv.mtd b/docs/site/files/dml-language-reference/data.csv.mtd new file mode 100644 index 00000000000..6ddbf26d177 --- /dev/null +++ b/docs/site/files/dml-language-reference/data.csv.mtd @@ -0,0 +1,7 @@ +{ + "data_type": "frame", + "format": "csv", + "sep": ",", + "header": true, + "na.strings": [ "NA", "" ] +} \ No newline at end of file diff --git a/docs/site/files/dml-language-reference/data.spec.json b/docs/site/files/dml-language-reference/data.spec.json new file mode 100644 index 00000000000..d87501759c2 --- /dev/null +++ b/docs/site/files/dml-language-reference/data.spec.json @@ -0,0 +1,24 @@ +{ + "omit": [ "zipcode" ] + ,"impute": + [ { "name": "district" , "method": "constant", "value": "south" } + ,{ "name": "numbedrooms" , "method": "constant", "value": 2 } + ,{ "name": "numbathrooms", "method": "constant", "value": 1 } + ,{ "name": "floors" , "method": "constant", "value": 1 } + ,{ "name": "view" , "method": "global_mode" } + ,{ "name": "askingprice" , "method": "global_mean" } + ,{ "name": "sqft" , "method": "global_mean" } + ] + + ,"recode": + [ "zipcode", "district", "numbedrooms", "numbathrooms", "floors", "view" ] + + ,"bin": + [ { "name": "saleprice" , "method": "equi-width", "numbins": 3 } + ,{ "name": "sqft" , "method": "equi-width", 
"numbins": 4 } + ] + + ,"dummycode": + [ "district", "numbathrooms", "floors", "view", "saleprice", "sqft" ] + +} \ No newline at end of file diff --git a/docs/site/files/dml-language-reference/data.spec2.json b/docs/site/files/dml-language-reference/data.spec2.json new file mode 100644 index 00000000000..0fa23f4bcb5 --- /dev/null +++ b/docs/site/files/dml-language-reference/data.spec2.json @@ -0,0 +1,23 @@ +{ + "ids": true + ,"omit" : [ 1 ] + ,"impute": + [ { "id": 2, "method": "constant", "value": "south" } + ,{ "id": 4, "method": "constant", "value": 2 } + ,{ "id": 5, "method": "constant", "value": 1 } + ,{ "id": 6, "method": "constant", "value": 1 } + ,{ "id": 7, "method": "global_mode" } + ,{ "id": 9, "method": "global_mean" } + ,{ "id": 3, "method": "global_mean" } + ] + + ,"recode": [ 1, 2, 4, 5, 6, 7 ] + + ,"bin": + [ { "id": 8, "method": "equi-width", "numbins": 3 } + ,{ "id": 3, "method": "equi-width", "numbins": 4 } + ] + + ,"dummycode": [ 2, 5, 6, 7, 8, 3 ] + +} diff --git a/docs/site/files/dml-language-reference/data.spec3.json b/docs/site/files/dml-language-reference/data.spec3.json new file mode 100644 index 00000000000..1b4b355cff3 --- /dev/null +++ b/docs/site/files/dml-language-reference/data.spec3.json @@ -0,0 +1,24 @@ +{ + "omit": [ "zipcode" ] + ,"impute": + [ { "name": "district" , "method": "constant", "value": "south" } + ,{ "name": "numbedrooms" , "method": "constant", "value": 2 } + ,{ "name": "numbathrooms", "method": "constant", "value": 1 } + ,{ "name": "floors" , "method": "constant", "value": 1 } + ,{ "name": "view" , "method": "global_mode" } + ,{ "name": "askingprice" , "method": "global_mean" } + ,{ "name": "sqft" , "method": "global_mean" } + ] + + ,"recode": + [ "zipcode", "district", "numbedrooms", "numbathrooms", "floors", "view" ] + + ,"dummycode": + [ "district", "numbathrooms", "floors", "view" ] + + ,"scale": + [ { "name": "sqft", "method": "mean-subtraction" } + ,{ "name": "saleprice", "method": "z-score" } + ,{ "name": 
"askingprice", "method": "z-score" } + ] +} \ No newline at end of file diff --git a/docs/site/files/dml-language-reference/homes.csv b/docs/site/files/dml-language-reference/homes.csv new file mode 100644 index 00000000000..aeed6013017 --- /dev/null +++ b/docs/site/files/dml-language-reference/homes.csv @@ -0,0 +1,149 @@ +zipcode,district,sqft,numbedrooms,numbathrooms,floors,view,saleprice,askingprice +95141,west,1373,7,1,3,FALSE,695,698 +91312,south,3261,6,2,2,FALSE,902,906 +94555,north,1835,3,3,3,TRUE,888,892 +95141,east,2833,6,2.5,2,TRUE,927,932 +96334,south,2742,6,2.5,2,FALSE,872,876 +96334,north,2195,5,2.5,2,FALSE,799,803 +98755,north,3469,7,2.5,2,FALSE,958,963 +96334,west,1685,7,1.5,2,TRUE,757,760 +95141,west,2238,4,3,3,FALSE,894,899 +91312,west,1245,4,1,1,FALSE,547,549 +98755,south,3702,7,3,1,FALSE,959,964 +98755,north,1865,7,1,2,TRUE,742,745 +94555,north,3837,3,1,1,FALSE,839,842 +91312,west,2139,3,1,3,TRUE,820,824 +95141,north,3824,4,3,1,FALSE,954,958 +98755,east,2858,5,1.5,1,FALSE,759,762 +91312,south,1827,7,3,1,FALSE,735,738 +91312,south,3557,2,2.5,1,FALSE,888,892 +91312,south,2553,2,2.5,2,TRUE,884,889 +96334,west,1682,3,1.5,1,FALSE,625,628 +98755,south,3926,6,2,2,TRUE,1040,1044 +96334,east,2790,5,2.5,3,FALSE,923,927 +95141,west,3928,4,2,3,FALSE,1037,1042 +94555,south,2000,1,3,2,TRUE,844,848 +96334,east,2688,5,2,3,TRUE,938,943 +94555,south,3533,2,1.5,2,FALSE,890,894 +94555,south,2639,3,2,3,FALSE,876,880 +91312,west,2462,4,2.5,1,TRUE,828,832 +94555,north,2420,1,1.5,3,FALSE,809,813 +96334,west,3911,6,1.5,3,TRUE,1072,1077 +96334,west,2166,6,1.5,3,TRUE,867,872 +94555,south,3855,6,2,1,FALSE,914,918 +91312,west,1971,2,3,1,TRUE,790,794 +95141,east,1769,4,1,1,TRUE,652,655 +98755,north,3774,6,1,2,TRUE,961,966 +96334,west,1044,2,3,1,TRUE,685,688 +95141,north,2561,7,1.5,1,TRUE,790,794 +95141,south,2255,2,2,3,TRUE,883,887 +94555,north,3085,6,2,1,FALSE,819,823 +98755,south,1273,2,1.5,2,FALSE,628,631 +91312,west,3785,5,3,3,TRUE,1133,1138 
+91312,west,3270,7,1.5,3,FALSE,943,947 +98755,south,1749,2,2,2,FALSE,712,715 +98755,south,1625,7,1.5,2,FALSE,691,694 +96334,north,3010,7,1.5,2,FALSE,848,851 +91312,south,3919,5,1,3,TRUE,1033,1038 +91312,south,1976,1,2,1,TRUE,726,729 +91312,west,3953,3,1.5,3,FALSE,1006,1010 +95141,west,3439,4,2,2,FALSE,921,925 +94555,east,3570,7,1,2,TRUE,934,938 +98755,west,2484,5,3,2,TRUE,926,931 +94555,south,1349,3,2,2,TRUE,721,724 +98755,west,3967,3,2,3,TRUE,1095,1100 +94555,west,2090,7,3,2,TRUE,885,889 +96334,east,1856,5,2,3,TRUE,841,845 +91312,north,1922,2,3,1,TRUE,775,778 +98755,north,1199,3,3,3,FALSE,761,765 +96334,east,2108,3,1,3,TRUE,806,810 +96334,west,3901,4,2,2,FALSE,976,981 +94555,south,2654,6,1.5,2,TRUE,859,863 +94555,west,3805,6,2,3,TRUE,1085,1090 +95141,south,3199,4,2,3,FALSE,947,951 +98755,west,3786,5,1,1,TRUE,909,913 +94555,east,2160,1,1,1,FALSE,629,631 +95141,east,3152,7,2,1,TRUE,883,887 +94555,east,1592,2,3,2,TRUE,791,795 +95141,east,3903,1,2.5,2,FALSE,976,981 +91312,south,1076,2,2.5,1,FALSE,597,600 +96334,west,1719,1,1.5,3,FALSE,738,742 +94555,north,1439,4,1.5,1,FALSE,589,592 +91312,east,1961,2,3,1,TRUE,775,778 +94555,north,2471,1,1.5,1,TRUE,753,756 +91312,west,3930,4,2.5,2,FALSE,1004,1009 +95141,south,2833,1,1,1,FALSE,718,721 +96334,south,2580,4,1,2,TRUE,816,820 +94555,south,2169,3,2.5,3,TRUE,904,908 +95141,east,3329,4,3,3,TRUE,1064,1069 +96334,south,3392,4,2,3,TRUE,1026,1031 +96334,east,3688,6,2.5,3,FALSE,1032,1037 +98755,west,3347,3,2.5,2,TRUE,991,996 +95141,east,1810,5,1,1,FALSE,606,609 +95141,east,3753,1,2.5,2,FALSE,959,963 +94555,east,3906,2,1.5,1,FALSE,866,870 +96334,east,1732,3,2,1,TRUE,700,703 +96334,south,2188,4,2,1,TRUE,767,771 +96334,south,3750,6,2,2,FALSE,963,967 +98755,north,2331,1,1.5,1,TRUE,740,743 +94555,north,1512,4,3,3,TRUE,854,858 +98755,north,3352,3,3,3,FALSE,1014,1018 +94555,south,3426,3,2.5,2,FALSE,937,941 +98755,south,3211,5,3,1,TRUE,948,953 +98755,west,2747,2,2.5,1,FALSE,803,806 +96334,east,3952,6,1.5,1,TRUE,946,950 
+91312,north,3814,6,1.5,2,FALSE,934,938 +95141,south,3700,7,2.5,1,FALSE,929,933 +95141,east,3154,4,2.5,1,TRUE,898,902 +91312,south,2648,4,1.5,2,FALSE,793,797 +98755,north,1394,4,1.5,1,FALSE,587,590 +91312,west,2709,5,2,2,FALSE,837,841 +94555,east,3946,6,1,2,TRUE,974,978 +91312,north,3905,6,2,2,FALSE,973,977 +98755,east,3248,5,1.5,1,TRUE,860,864 +96334,north,1774,7,1.5,1,FALSE,644,647 +94555,east,1995,2,3,3,TRUE,897,902 +94555,east,2876,2,3,1,FALSE,828,832 +94555,east,3229,4,2,3,TRUE,995,1000 +94555,north,1079,5,2,2,FALSE,638,641 +95141,south,3695,7,2.5,3,FALSE,1046,1051 +96334,west,3694,5,1,1,TRUE,897,901 +98755,west,1918,5,1,2,FALSE,693,697 +94555,south,1647,6,1,2,TRUE,713,716 +96334,west,2691,3,2.5,2,FALSE,858,862 +95141,south,1333,2,2,2,TRUE,716,719 +95141,west,2609,4,2,1,FALSE,765,768 +91312,west,2125,3,1,2,TRUE,760,763 +91312,west,2417,5,1,1,FALSE,689,692 +98755,west,3623,2,1,3,TRUE,995,999 +98755,north,3343,6,3,1,FALSE,908,912 +96334,south,1074,7,2.5,3,FALSE,739,743 +96334,south,2972,3,1,2,TRUE,858,862 +91312,east,1637,2,2,1,FALSE,626,629 +91312,north,1807,2,3,2,FALSE,765,768 +95141,north,1457,2,3,1,FALSE,667,670 +91312,west,3043,6,1,1,FALSE,766,770 +91312,west,3045,6,1.5,3,TRUE,967,972 +98755,north,1980,5,1,1,TRUE,688,691 +98755,west,1112,3,1.5,3,TRUE,732,735 +98755,south,1533,6,1.5,3,FALSE,734,738 +91312,east,1442,5,2,2,FALSE,675,678 +91312,north,3171,6,1,3,TRUE,945,949 +96334,east,3072,5,1.5,2,FALSE,842,846 +94555,east,3506,4,1.5,3,TRUE,1000,1005 +94555,south,1574,2,1,3,FALSE,691,694 +94555,east,3567,6,3,1,FALSE,926,931 +91312,south,1194,1,1,2,TRUE,637,640 +94555,east,1031,3,1.5,1,FALSE,532,535 +94555,south,2776,3,2.5,2,TRUE,916,920 +91312,south,2009,5,1.5,1,TRUE,719,723 +96334,north,3784,2,1,2,FALSE,889,893 +94555,west,1975,6,1.5,2,FALSE,729,732 +98755,west,2444,2,3,2,FALSE,854,857 +95141,south,1684,3,1.5,3,FALSE,737,740 +98755,north,1729,6,1,1,TRUE,663,666 +95141,north,2236,1,1,2,FALSE,702,705 +95141,south,2061,7,3,1,FALSE,764,768 
+98755,south,3561,3,2.5,3,TRUE,1070,1075 +94555,east,2143,3,1,2,FALSE,694,697 +96334,north,3840,7,1,1,FALSE,858,862 diff --git a/docs/site/files/dml-language-reference/homes.csv.mtd b/docs/site/files/dml-language-reference/homes.csv.mtd new file mode 100644 index 00000000000..c47626a9bff --- /dev/null +++ b/docs/site/files/dml-language-reference/homes.csv.mtd @@ -0,0 +1,5 @@ +{ + "data_type": "frame", + "format": "csv", + "header": true +} diff --git a/docs/site/files/dml-language-reference/homes.tfspec_bin2.json b/docs/site/files/dml-language-reference/homes.tfspec_bin2.json new file mode 100644 index 00000000000..a5a5375fb6f --- /dev/null +++ b/docs/site/files/dml-language-reference/homes.tfspec_bin2.json @@ -0,0 +1,5 @@ +{ + "recode": [ "zipcode", "district", "view" ], "bin": [ + { "name": "saleprice" , "method": "equi-width", "numbins": 3 } + ,{ "name": "sqft", "method": "equi-width", "numbins": 4 }] + } \ No newline at end of file diff --git a/docs/site/files/dml-language-reference/homes.tfspec_recode2.json b/docs/site/files/dml-language-reference/homes.tfspec_recode2.json new file mode 100644 index 00000000000..d4466282723 --- /dev/null +++ b/docs/site/files/dml-language-reference/homes.tfspec_recode2.json @@ -0,0 +1,2 @@ +{ + "recode": [ "zipcode", "district", "view" ] } \ No newline at end of file