# 猜題 ## 各縣市警察局有幾個 > police = LOAD '/dataset/5958/5958.csv' USING PigStorage(',') AS (name: chararray, code: chararray, address: chararray); foreach_police = FOREACH police GENERATE $0,SUBSTRING($2,0,3); gp_police = GROUP foreach_police BY $1; count_police = FOREACH gp_police GENERATE $0,COUNT($1); dump colleage_police; ``` (南投縣,99) (嘉義市,15) (嘉義縣,87) (基隆市,28) (宜蘭縣,62) (屏東縣,91) (彰化縣,81) (新北市,176) (新竹市,19) (新竹縣,61) (桃園市,95) (澎湖縣,28) (臺中市,133) (臺北市,107) (臺南市,163) (臺東縣,67) (花蓮縣,73) (苗栗縣,69) (連江縣,7) (金門縣,9) (雲林縣,72) (高雄市,153) ``` ## 各縣市國小有幾間 > element = LOAD '/dataset/6087/6087.csv' Using PigStorage (',') AS(code:chararray,school:chararray,city:chararray,address:chararray, phone:chararray,url:chararray); foreach_element = FOREACH element GENERATE $1,$2; gp_element = GROUP foreach_element BY $1; count_element = FOREACH gp_element GENERATE $0,COUNT($1); dump count_element; ``` (南投縣,139) (嘉義市,20) (嘉義縣,124) (基隆市,42) (宜蘭縣,76) (屏東縣,168) (彰化縣,175) (新北市,216) (新竹市,34) (新竹縣,86) (桃園市,190) (澎湖縣,37) (臺中市,236) (臺北市,151) (臺南市,211) (臺東縣,88) (花蓮縣,103) (苗栗縣,114) (連江縣,7) (金門縣,19) (雲林縣,155) (高雄市,242) ``` ## 各縣市平均一所小學有幾所警察局 > element = LOAD '/dataset/6087/6087.csv' Using PigStorage (',') AS(code:chararray,school:chararray,city:chararray,address:chararray, phone:chararray,url:chararray); foreach_element = FOREACH element GENERATE $1,$2; gp_element = GROUP foreach_element BY $1; count_element = FOREACH gp_element GENERATE $0,COUNT($1); > police = LOAD '/dataset/5958/5958.csv' USING PigStorage(',') AS (name: chararray, code: chararray, address: chararray); foreach_police = FOREACH police GENERATE $0,SUBSTRING($2,0,3); gp_police = GROUP foreach_police BY $1; count_police = FOREACH gp_police GENERATE $0,COUNT($1); > join_element_police = JOIN count_element BY $0,count_police BY $0; element_police = FOREACH join_element_police GENERATE $0,$1,$3; per_school = FOREACH element_police GENERATE $0, ROUND_TO((double)$2/$1,2); dump per_school ``` (南投縣,0.71) (嘉義市,0.75) (嘉義縣,0.7) (基隆市,0.67) (宜蘭縣,0.82) (屏東縣,0.54) (彰化縣,0.46) (新北市,0.81) (新竹市,0.56) (新竹縣,0.71) (桃園市,0.5) (澎湖縣,0.76) (臺中市,0.56) (臺北市,0.71) (臺南市,0.77) (臺東縣,0.76) (花蓮縣,0.71) (苗栗縣,0.61) (連江縣,1.0) (金門縣,0.47) (雲林縣,0.46) (高雄市,0.63) ``` ## 各縣市幼兒園有幾間 > kid = LOAD '/dataset/6086/6086.csv' Using PigStorage (',') AS(code:chararray,school:chararray,city:chararray,address:chararray, phone:chararray); foreach_kid= FOREACH kid GENERATE $1,$2; gp_kid = GROUP foreach_kid BY $1; count_kid = FOREACH gp_kid GENERATE $0,COUNT($1); dump count_kid; ``` (南投縣,184) (嘉義市,69) (嘉義縣,153) (基隆市,107) (宜蘭縣,124) (屏東縣,289) (彰化縣,370) (新北市,1134) (新竹市,161) (新竹縣,237) (桃園市,584) (澎湖縣,27) (臺中市,737) (臺北市,689) (臺南市,565) (臺東縣,122) (花蓮縣,135) (苗栗縣,182) (連江縣,5) (金門縣,26) (雲林縣,146) (高雄市,674) ``` ## 各縣市平均一所幼稚園有幾所警察局 > kid = LOAD '/dataset/6086/6086.csv' Using PigStorage (',') AS(code:chararray,school:chararray,city:chararray,address:chararray, phone:chararray); foreach_kid= FOREACH kid GENERATE $1,$2; gp_kid = GROUP foreach_kid BY $1; count_kid = FOREACH gp_kid GENERATE $0,COUNT($1); > police = LOAD '/dataset/5958/5958.csv' USING PigStorage(',') AS (name: chararray, code: chararray, address: chararray); foreach_police = FOREACH police GENERATE $0,SUBSTRING($2,0,3); gp_police = GROUP foreach_police BY $1; count_police = FOREACH gp_police GENERATE $0,COUNT($1); > join_kid_police = JOIN count_kid BY $0,count_police BY $0; kid_police = FOREACH join_kid_police GENERATE $0,$1,$3; per_kid = FOREACH kid_police GENERATE $0, ROUND_TO((double)$2/$1,2); dump per_kid; ``` (南投縣,0.54) (嘉義市,0.22) (嘉義縣,0.57) (基隆市,0.26) (宜蘭縣,0.5) (屏東縣,0.31) (彰化縣,0.22) (新北市,0.16) (新竹市,0.12) (新竹縣,0.26) (桃園市,0.16) (澎湖縣,1.04) (臺中市,0.18) (臺北市,0.16) (臺南市,0.29) (臺東縣,0.55) (花蓮縣,0.54) (苗栗縣,0.38) (連江縣,1.4) (金門縣,0.35) (雲林縣,0.49) (高雄市,0.23) ``` ## 各縣市大學生有幾間 > colleage = LOAD '/dataset/9621/9621.csv' Using PigStorage (',') AS(city:chararray,school:chararray,faculty:chararray,courses:chararray,level:chararray,student:int,teachers:int); foreach_colleage = FOREACH colleage GENERATE $0,$1; gp_colleage = GROUP foreach_colleage BY $0; count_colleage = FOREACH gp_colleage GENERATE $0,COUNT($1); dump count_colleage; ``` (南投縣,115) (嘉義市,155) (嘉義縣,263) (基隆市,149) (宜蘭縣,126) (屏東縣,334) (彰化縣,356) (新北市,1039) (新竹市,456) (新竹縣,130) (桃園市,708) (澎湖縣,22) (臺中市,1324) (臺北市,2072) (臺南市,966) (臺東縣,70) (花蓮縣,202) (苗栗縣,148) (金門縣,41) (雲林縣,209) (高雄市,1196) ``` ## 各縣市平均一所大專院校有幾所警察局 > colleage = LOAD '/dataset/9621/9621.csv' Using PigStorage (',') AS(city:chararray,school:chararray,faculty:chararray,courses:chararray,level:chararray,student:int,teachers:int); foreach_colleage = FOREACH colleage GENERATE $0,$1; gp_colleage = GROUP foreach_colleage BY $0; count_colleage = FOREACH gp_colleage GENERATE $0,COUNT($1); > police = LOAD '/dataset/5958/5958.csv' USING PigStorage(',') AS (name: chararray, code: chararray, address: chararray); foreach_police = FOREACH police GENERATE $0,SUBSTRING($2,0,3); gp_police = GROUP foreach_police BY $1; count_police = FOREACH gp_police GENERATE $0,COUNT($1); > join_colleage_police = JOIN count_colleage BY $0,count_police BY $0; colleage_police = FOREACH join_colleage_police GENERATE $0,$1,$3; per_colleage = FOREACH colleage_police GENERATE $0, ROUND_TO((double)$2/$1,2); dump per_colleage; ``` (南投縣,0.86) (嘉義市,0.1) (嘉義縣,0.33) (基隆市,0.19) (宜蘭縣,0.49) (屏東縣,0.27) (彰化縣,0.23) (新北市,0.17) (新竹市,0.04) (新竹縣,0.47) (桃園市,0.13) (澎湖縣,1.27) (臺中市,0.1) (臺北市,0.05) (臺南市,0.17) (臺東縣,0.96) (花蓮縣,0.36) (苗栗縣,0.47) (金門縣,0.22) (雲林縣,0.34) (高雄市,0.13) ``` ## 各縣市學生老師比 > colleage = LOAD '/dataset/9621/9621.csv' Using PigStorage (',') AS(city:chararray,school:chararray,faculty:chararray,courses:chararray,level:chararray,student:int,teachers:int); gp_colleage = GROUP colleage BY $0; sum_colleage = FOREACH gp_colleage GENERATE $0, SUM($1.$5),SUM($1.$6); foreach_colleage = FOREACH sum_colleage GENERATE $0, ROUND_TO((double)$1/$2,2); dump foreach_colleage; ``` (南投縣,25.01) (嘉義市,25.52) (嘉義縣,24.53) (基隆市,23.66) (宜蘭縣,22.5) (屏東縣,28.77) (彰化縣,28.7) (新北市,31.35) (新竹市,22.37) (新竹縣,31.66) (桃園市,26.62) (澎湖縣,24.46) (臺中市,30.13) (臺北市,24.95) (臺南市,26.27) (臺東縣,22.89) (花蓮縣,18.78) (苗栗縣,29.3) (金門縣,30.21) (雲林縣,29.03) (高雄市,27.76) ``` ## 各部別的一個老師分別負責幾個學生 > colleage = LOAD '/dataset/9621/9621.csv' Using PigStorage (',') AS(city:chararray,school:chararray,faculty:chararray,courses:chararray,level:chararray,student:int,teachers:int); gp_colleage = GROUP colleage BY $3; sum_colleage = FOREACH gp_colleage GENERATE $0, SUM($1.$5),SUM($1.$6); foreach_colleage = FOREACH sum_colleage GENERATE $0, ROUND_TO((double)$1/$2,2); dump foreach_colleage; ``` (修,505.74) (日,22.69) (職,1094.08) (P進,747.8) ``` ## 各部別學生老師比例 > colleage = LOAD '/dataset/9621/9621.csv' Using PigStorage (',') AS(city:chararray,school:chararray,faculty:chararray,courses:chararray,level:chararray,student:int,teachers:int); gp_colleage = GROUP colleage BY $3; sum_colleage = FOREACH gp_colleage GENERATE $0, SUM($1.$5),SUM($1.$6); a = FOREACH sum_colleage GENERATE $0,ROUND_TO((double)$1/(($1+$2)*0.01),2), ROUND_TO((double)$2/(($1+$2)*0.01),2); ``` (修,99.8,0.2) (日,95.78,4.22) (職,99.91,0.09) (P進,99.87,0.13) ``` ## 各部門有關資訊管理及資訊工程學生與老師數量 > colleage = LOAD '/dataset/9621/9621.csv' Using PigStorage (',') AS(city:chararray,school:chararray,faculty:chararray,courses:chararray,level:chararray,student:int,teachers:int); filter_colleage = FILTER colleage BY $2 matches '資訊管理.*' OR $2 matches '資訊工程.*'; gp_colleage = GROUP filter_colleage BY $3; sum_colleage = FOREACH gp_colleage GENERATE $0, SUM($1.$5), SUM($1.$6); dump sum_colleage; ``` (修,7519,17) (日,60867,2327) (職,2278,0) (P進,1219,0) ``` ## 資訊開頭的科系,學士、碩士、博士、五專、二技 學生/老師比例 > colleage = LOAD '/dataset/9621/9621.csv' Using PigStorage (',') AS(city:chararray,school:chararray,faculty:chararray,courses:chararray,level:chararray,student:int,teachers:int); filter_colleage = FILTER colleage BY $2 matches '資訊.*'; gp_colleage = GROUP filter_colleage BY $4; sum_colleage = FOREACH gp_colleage GENERATE $0, SUM($1.$5), SUM($1.$6); percent_colleage = FOREACH sum_colleage GENERATE $0,ROUND_TO((double)$1/(($1+$2)*0.01),2), ROUND_TO((double)$2/(($1+$2)*0.01),2); dump percent_colleage; ``` (博士,100.0,0.0) (四技,96.62,3.38) (學士,95.96,4.04) (碩士,99.47,0.53) (2二專,98.28,1.72) (5五專,98.9,1.1) (C二技,100.0,0.0) (,0.0,100.0) ``` ## 縣市部別的學生與老師的比例 > colleage = LOAD '/dataset/9621/9621.csv' Using PigStorage (',') AS(city:chararray,school:chararray,faculty:chararray,courses:chararray,level:chararray,student:int,teachers:int); filter_colleage = FILTER colleage BY $3 == '修'; gp_colleage = GROUP filter_colleage BY $0; sum_colleage = FOREACH gp_colleage GENERATE $0, SUM($1.$5),SUM($1.$6); a = FOREACH sum_colleage GENERATE $0,ROUND_TO((double)$1/(($1+$2)*0.01),2), ROUND_TO((double)$2/(($1+$2)*0.01),2); ``` (南投縣,修,100.0,0.0) (嘉義市,修,99.66,0.34) (嘉義縣,修,99.91,0.09) (基隆市,修,100.0,0.0) (宜蘭縣,修,,) (屏東縣,修,99.7,0.3) (彰化縣,修,99.67,0.33) (新北市,修,99.91,0.09) (新竹市,修,99.93,0.07) (新竹縣,修,99.84,0.16) (桃園市,修,99.87,0.13) (澎湖縣,修,100.0,0.0) (臺中市,修,99.9,0.1) (臺北市,修,99.81,0.19) (臺南市,修,99.81,0.19) (臺東縣,修,100.0,0.0) (花蓮縣,修,99.02,0.98) (苗栗縣,修,99.01,0.99) (雲林縣,修,99.88,0.12) (高雄市,修,99.72,0.28) ``` > filter_colleage = FILTER colleage BY $3 == '日'; gp_colleage = GROUP filter_colleage BY $0; sum_colleage = FOREACH gp_colleage GENERATE $0, SUM($1.$5),SUM($1.$6); a = FOREACH sum_colleage GENERATE $0,ROUND_TO((double)$1/(($1+$2)*0.01),2), ROUND_TO((double)$2/(($1+$2)*0.01),2); ``` (南投縣,日,95.65,4.35) (嘉義市,日,95.34,4.66) (嘉義縣,日,95.37,4.63) (基隆市,日,95.48,4.52) (宜蘭縣,日,95.5,4.5) (屏東縣,日,95.97,4.03) (彰化縣,日,95.78,4.22) (新北市,日,96.29,3.71) (新竹市,日,95.23,4.77) (新竹縣,日,95.52,4.48) (桃園市,日,95.61,4.39) (澎湖縣,日,95.57,4.43) (臺中市,日,96.11,3.89) (臺北市,日,95.68,4.32) (臺南市,日,95.67,4.33) (臺東縣,日,95.19,4.81) (花蓮縣,日,94.52,5.48) (苗栗縣,日,96.1,3.9) (金門縣,日,95.99,4.01) (雲林縣,日,96.08,3.92) (高雄市,日,95.7,4.3) ``` > filter_colleage = FILTER colleage BY $3 == '職'; gp_colleage = GROUP filter_colleage BY $0; sum_colleage = FOREACH gp_colleage GENERATE $0, SUM($1.$5),SUM($1.$6); a = FOREACH sum_colleage GENERATE $0,ROUND_TO((double)$1/(($1+$2)*0.01),2), ROUND_TO((double)$2/(($1+$2)*0.01),2); ``` (南投縣,職,100.0,0.0) (嘉義市,職,100.0,0.0) (嘉義縣,職,100.0,0.0) (基隆市,職,99.84,0.16) (宜蘭縣,職,100.0,0.0) (屏東縣,職,99.5,0.5) (彰化縣,職,100.0,0.0) (新北市,職,100.0,0.0) (新竹市,職,99.93,0.07) (新竹縣,職,100.0,0.0) (桃園市,職,99.95,0.05) (澎湖縣,職,100.0,0.0) (臺中市,職,99.97,0.03) (臺北市,職,99.92,0.08) (臺南市,職,99.75,0.25) (臺東縣,職,100.0,0.0) (花蓮縣,職,100.0,0.0) (苗栗縣,職,100.0,0.0) (金門縣,職,100.0,0.0) (雲林縣,職,99.09,0.91) (高雄市,職,99.92,0.08) ``` > filter_colleage = FILTER colleage BY $3 == 'P進'; gp_colleage = GROUP filter_colleage BY $0; sum_colleage = FOREACH gp_colleage GENERATE $0, SUM($1.$5),SUM($1.$6); a = FOREACH sum_colleage GENERATE $0,ROUND_TO((double)$1/(($1+$2)*0.01),2), ROUND_TO((double)$2/(($1+$2)*0.01),2); ``` (嘉義市,P進,100.0,0.0) (嘉義縣,P進,100.0,0.0) (基隆市,P進,100.0,0.0) (宜蘭縣,P進,100.0,0.0) (屏東縣,P進,100.0,0.0) (彰化縣,P進,100.0,0.0) (新北市,P進,99.85,0.15) (新竹市,P進,99.86,0.14) (桃園市,P進,99.82,0.18) (臺中市,P進,99.84,0.16) (臺北市,P進,99.78,0.22) (臺南市,P進,100.0,0.0) (臺東縣,P進,100.0,0.0) (苗栗縣,P進,99.37,0.63) (金門縣,P進,100.0,0.0) (高雄市,P進,100.0,0.0) ``` ## 請問臺北市所有大學資訊工程系人數 > colleage = LOAD '/dataset/9621/9621.csv' Using PigStorage (',') AS(city:chararray,school:chararray,faculty:chararray,courses:chararray,level:chararray,student:int,teachers:int); filter_colleage = FILTER colleage BY $0 == '臺北市' AND $2 matches '資訊工程.*'; gp_colleage = GROUP filter_colleage BY $0; sum_colleage = FOREACH gp_colleage GENERATE $0, SUM($1.$5)+SUM($1.$6); dump sum_colleage; ``` (臺北市,4948) ``` ## 資訊開頭的科系,各部門老師平均一人負責幾個學生 > colleage = LOAD '/dataset/9621/9621.csv' Using PigStorage (',') AS (city:chararray,school:chararray,faculty:chararray,courses:chararray,level:chararray,student:int,teachers:int); filter_colleage = FILTER colleage BY $2 matches '資訊.*'; gp_colleage = GROUP filter_colleage BY $3; sum_colleage = FOREACH gp_colleage GENERATE $0, ROUND_TO((double)SUM($1.$5)/SUM($1.$6),2); dump sum_colleage; ``` (修,464.55) (日,26.24) (職,) (P進,) ```