delta constant 1 348 198 0 false minsup constant 2 330 137 5 false delta constant 3 446 155 0 false minsup constant 4 430 94 5 false cover constant 5 458 215 3 false minsup constant 6 95 113 Ariane 25 true %alea mv constant 7 196 198 Ariane 0 true heart-nom.csv loader 8 7 306 ./data/heart-nom.csv Ariane 1 heart-nom.col loader 9 3 386 ./data/heart-nom.col Ariane 1 delta constant 10 113 182 Ariane 0 true random-mv-insertion macro-operator 11 210 294 1 2 1 filename 2 11 16 ./script/addMV.awk false introRandom system 3 64 87 awk -f $p $i > $o 1 3 1 mv-density mv-density 4 191 148 missing values 1 mv-density mv density system 2 65 44 awk -F, $p $i > $o 1 1 1 setstatus setstatus 3 150 46 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 0 InSlotParameter 0 3 OutSlotResult 0 0 InSlotParameter 0 3 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 2 InSlotParameter 0 '{total+=NF;for(i=1;i<=NF;i++)if($i=="?")mv++}END{print mv/total}' 3 InSlotImage 0 2 OutSlotImage 0 0 InSlotImage 0 3 OutSlotImage 0 0 InSlotImage 0 3 OutSlotImage 0 0 InSlotParameter 0 4 OutSlotResult 0 0 InSlotParameter 0 4 OutSlotResult 0 3 InSlotImage 0 0 OutSlotImage 0 3 InSlotParameter 0 2 OutSlotResult 0 3 InSlotParameter 1 0 OutSlotResult 0 3 InSlotParameter 2 0 OutSlotResult 1 4 InSlotImage 0 3 OutSlotImage 0 rule-mv-insertion macro-operator 12 105 294 1 2 1 mvleila system 2 138 126 mvleila $p $i > $o 1 2 1 grep _ system 3 211 138 sed -n '1d;s/_//pg' $i > $o 1 1 wc -l wc -l 4 339 34 shell 1 wc -l wc -l system 2 121 50 wc -l < $i > $o 1 1 setstatus setstatus 3 223 41 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 0 InSlotParameter 0 3 OutSlotResult 0 0 InSlotParameter 0 3 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 3 InSlotImage 0 2 OutSlotImage 0 mv-insertion for 5 335 114 2 3 1 filename 2 269 159 ./script/mv-insertion.awk false max item system 3 257 64 awk $p $i > $o 1 1 1 apply system 4 329 247 awk -f $p0 $i $p1 > $o 2 2 1 setstatus setstatus 5 319 66 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 awk system 6 64 44 awk $p0 $i $p1 > $o 1 2 1 0 InSlotImage 0 4 OutSlotImage 0 0 InSlotImage 1 0 OutSlotImage 0 0 InSlotImage 2 4 OutSlotImage 0 0 InSlotImage 0 4 OutSlotImage 0 0 InSlotImage 1 0 OutSlotImage 0 0 InSlotImage 2 4 OutSlotImage 0 0 InSlotParameter 0 4 OutSlotResult 0 0 InSlotParameter 0 4 OutSlotResult 0 3 InSlotImage 0 0 OutSlotImage 1 3 InSlotParameter 0 '{if($NF!="?" && $NF>max)max=$NF}END{print max}' 4 InSlotImage 0 0 OutSlotImage 1 true 0 15 106 1 209 106 2 209 289 3 328 289 4 InSlotImage 1 6 OutSlotImage 0 true 0 113 86 1 132 86 2 132 300 3 328 300 4 InSlotParameter 0 2 OutSlotResult 0 4 InSlotParameter 1 5 OutSlotResult 0 5 InSlotImage 0 3 OutSlotImage 0 6 InSlotImage 0 0 OutSlotImage 0 6 InSlotParameter 0 'BEGIN{line=ARGV[2];ARGC--}NR==line{print;exit}' 6 InSlotParameter 1 0 OutSlotResult 0 max item system 6 432 38 awk $p $i > $o 1 1 1 setstatus setstatus 7 494 40 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 rename system 8 504 137 awk $p0 $i $p1 > $o 1 2 1 note 9 760 409 iterating over these rules for replacing the items in the conclusion by a new symbol meaning missing value note 10 132 215 computing some rules note 11 469 218 renaming the mv to ? mv-density mv-density 12 633 299 missing values 1 mv-density mv density system 2 65 44 awk -F, $p $i > $o 1 1 1 setstatus setstatus 3 150 46 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 0 InSlotParameter 0 3 OutSlotResult 0 0 InSlotParameter 0 3 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 2 InSlotParameter 0 '{total+=NF;for(i=1;i<=NF;i++)if($i=="?")mv++}END{print mv/total}' 3 InSlotImage 0 2 OutSlotImage 0 sed system 13 24 44 sed $p $i > $o 1 1 1 0 InSlotImage 0 8 OutSlotImage 0 0 InSlotImage 0 8 OutSlotImage 0 0 InSlotParameter 0 12 OutSlotResult 0 0 InSlotParameter 0 12 OutSlotResult 0 2 InSlotImage 0 13 OutSlotImage 0 2 InSlotParameter 0 0 OutSlotResult 0 2 InSlotParameter 1 0 OutSlotResult 1 true 0 106 12 1 106 52 2 160 52 3 160 126 3 InSlotImage 0 2 OutSlotImage 0 4 InSlotImage 0 3 OutSlotImage 0 5 InSlotImage 0 3 OutSlotImage 0 5 InSlotImage 1 13 OutSlotImage 0 5 InSlotParameter 0 1 5 InSlotParameter 1 4 OutSlotResult 0 5 InSlotParameter 2 1 6 InSlotImage 0 13 OutSlotImage 0 6 InSlotParameter 0 '{if($NF!="?" && $NF>max)max=$NF}END{print max}' 7 InSlotImage 0 6 OutSlotImage 0 8 InSlotImage 0 5 OutSlotImage 0 8 InSlotParameter 0 'BEGIN{new=ARGV[2];ARGC--}{printf("%d",$1);for(i=2;i<=NF;i++)if($i>new)printf(",?");else printf(",%d",$i);printf("\n");}' 8 InSlotParameter 1 7 OutSlotResult 0 12 InSlotImage 0 8 OutSlotImage 0 13 InSlotImage 0 0 OutSlotImage 0 13 InSlotParameter 0 's/,/ /g' cluster stability macro-operator 13 625 282 2 1 csv to bin system 2 137 62 sed $p $i > $o 1 1 1 kmeans system 3 235 62 kmeans $p $i > $o 1 1 1 csv to bin system 4 136 134 sed $p $i > $o 1 1 1 kmeans system 5 236 134 kmeans $p $i > $o 1 1 1 1st col system 6 307 62 sed $p $i > $o 1 1 1 1st col system 7 309 134 sed $p $i > $o 1 1 1 paste system 8 383 105 paste $i > $o 2 1 filename 9 394 25 ./script/clusterStability.awk false awk system 10 469 104 awk -f $p $i > $o 1 1 1 setstatus setstatus 11 564 106 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 0 InSlotParameter 0 11 OutSlotResult 0 0 InSlotParameter 0 11 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 2 InSlotParameter 0 's/,/ /g' 3 InSlotImage 0 2 OutSlotImage 0 3 InSlotParameter 0 0 OutSlotResult 0 4 InSlotImage 0 0 OutSlotImage 1 4 InSlotParameter 0 's/,/ /g' 5 InSlotImage 0 4 OutSlotImage 0 5 InSlotParameter 0 0 OutSlotResult 0 6 InSlotImage 0 3 OutSlotImage 0 6 InSlotParameter 0 '1d;s/ .*//' 7 InSlotImage 0 5 OutSlotImage 0 7 InSlotParameter 0 '1d;s/ .*//' 8 InSlotImage 0 6 OutSlotImage 0 8 InSlotImage 1 7 OutSlotImage 0 10 InSlotImage 0 8 OutSlotImage 0 10 InSlotParameter 0 9 OutSlotResult 0 11 InSlotImage 0 10 OutSlotImage 0 K constant 14 620 219 3 false classification imputation macro-operator 15 440 305 2 3 1 random completion macro-operator 2 310 130 2 3 1 dictionary system 2 58 239 dictionary $i > $o 2 1 mv detection system 3 81 119 awk -F, $p $i > $o 1 1 1 wc -l wc -l 4 255 121 shell 1 wc -l wc -l system 2 121 50 wc -l < $i > $o 1 1 setstatus setstatus 3 223 41 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 0 InSlotParameter 0 3 OutSlotResult 0 0 InSlotParameter 0 3 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 3 InSlotImage 0 2 OutSlotImage 0 column completion iteration for 5 251 204 4 6 1 awk system 2 64 44 awk $p0 $i $p1 > $o 1 2 1 segmentation system 3 289 432 segmentation $i $o 2 2 col filter system 4 161 420 awk -F, $p0 $i $p1 > $o 1 2 1 note 5 296 372 model mv-order macro-operator 6 424 433 1 1 grep - system 2 131 141 sed -n /-/p $i > $o 1 1 grep -v - system 3 130 75 grep -v - $i > $o 1 1 cat system 4 194 78 cat $i > $o 2 1 0 InSlotImage 0 4 OutSlotImage 0 0 InSlotImage 0 4 OutSlotImage 0 0 InSlotParameter 0 4 OutSlotResult 0 0 InSlotParameter 0 4 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 3 InSlotImage 0 0 OutSlotImage 0 4 InSlotImage 0 3 OutSlotImage 0 4 InSlotImage 1 2 OutSlotImage 0 col dictionary system 7 512 246 awk $p0 $i $p1 > $o 1 2 1 note 8 298 527 targets head -1 system 9 591 258 head -1 $i > $o 1 1 setstatus setstatus 10 587 320 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 col filter system 11 161 609 awk -F, $p0 $i $p1 > $o 1 2 1 segmentation system 12 288 584 segmentation $i $o 2 2 touch touch 13 594 455 shell 1 touch echo -n eval101 2 155 155 eval 1 1 0 InSlotImage 0 2 OutSlotImage 0 0 InSlotImage 0 2 OutSlotImage 0 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotParameter 0 echo -n tail -1 system 14 663 258 tail -1 $i > $o 1 1 setstatus setstatus 15 667 323 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 for 16 677 419 3 6 1 mvminer system 2 101 180 mvminer $p $i > $o 1 2 1 grep _ system 3 228 192 sed -n /_/p $i > $o 1 1 rule filter system 4 394 77 awk $p0 $i $p1 > $o 1 2 1 sed system 5 489 77 sed $p $i > $o 1 1 1 chisquare system 6 591 187 chisquare $p $i > $o 2 1 1 cover system 7 720 198 cover $p $i > $o 2 1 1 rulescore system 8 829 221 rulescore $i > $o 2 1 remove mv system 9 452 209 sed $p $i > $o 1 1 1 note 10 147 130 compute rules paste system 11 1038 265 paste $i > $o 2 1 remove mv system 12 325 338 sed $p $i > $o 1 1 1 0 InSlotImage 0 11 OutSlotImage 0 0 InSlotImage 1 0 OutSlotImage 0 0 InSlotImage 2 0 OutSlotImage 1 true 0 15 106 1 1000 106 2 1000 306 3 1109 306 0 InSlotImage 3 11 OutSlotImage 0 0 InSlotImage 0 11 OutSlotImage 0 0 InSlotImage 1 0 OutSlotImage 0 0 InSlotImage 2 0 OutSlotImage 1 true 0 15 106 1 1000 106 2 1000 306 3 1109 306 0 InSlotImage 3 11 OutSlotImage 0 0 InSlotParameter 0 11 OutSlotResult 0 0 InSlotParameter 0 11 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 2 InSlotParameter 0 0 OutSlotResult 1 2 InSlotParameter 1 0 OutSlotResult 2 3 InSlotImage 0 2 OutSlotImage 0 4 InSlotImage 0 3 OutSlotImage 0 4 InSlotParameter 0 'BEGIN{target="_" ARGV[2];ARGC--;}{for(i=1;i<=NF;i++)if($i==target)print}' 4 InSlotParameter 1 0 OutSlotResult 0 5 InSlotImage 0 4 OutSlotImage 0 5 InSlotParameter 0 's/,.*//' 6 InSlotImage 0 5 OutSlotImage 0 6 InSlotImage 1 9 OutSlotImage 0 6 InSlotParameter 0 0 OutSlotResult 0 7 InSlotImage 0 6 OutSlotImage 0 7 InSlotImage 1 9 OutSlotImage 0 7 InSlotParameter 0 0 OutSlotResult 3 true 0 146 12 1 146 23 2 732 23 3 732 198 8 InSlotImage 0 7 OutSlotImage 0 8 InSlotImage 1 12 OutSlotImage 0 9 InSlotImage 0 0 OutSlotImage 0 9 InSlotParameter 0 's/-[0-9]* //g' 11 InSlotImage 0 0 OutSlotImage 2 11 InSlotImage 1 8 OutSlotImage 0 12 InSlotImage 0 0 OutSlotImage 1 12 InSlotParameter 0 's/-[0-9]* //g' vote filename 17 778 161 ./script/vote.awk false setstatus setstatus 18 151 151 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 cat system 19 1336 447 cat $i > $o 2 1 awk system 20 799 235 awk -f $p0 $i $p1 > $o 2 2 1 data system 21 229 610 sed $p $i > $o 1 1 1 lines system 22 228 676 awk -F, $p $i > $o 1 1 1 paste system 23 902 235 paste $p $i > $o 2 1 1 0 InSlotImage 0 19 OutSlotImage 0 0 InSlotImage 1 0 OutSlotImage 0 0 InSlotImage 2 0 OutSlotImage 1 0 InSlotImage 3 0 OutSlotImage 2 0 InSlotImage 4 19 OutSlotImage 0 0 InSlotImage 0 19 OutSlotImage 0 0 InSlotImage 1 0 OutSlotImage 0 0 InSlotImage 2 0 OutSlotImage 1 0 InSlotImage 3 0 OutSlotImage 2 0 InSlotImage 4 19 OutSlotImage 0 0 InSlotParameter 0 20 OutSlotResult 0 true 0 831 304 1 831 719 2 486 719 3 486 774 0 InSlotParameter 0 20 OutSlotResult 0 true 0 831 304 1 831 719 2 486 719 3 486 774 2 InSlotImage 0 0 OutSlotImage 0 2 InSlotParameter 0 'BEGIN{line=ARGV[2];ARGC--}NR==line{print;exit}' 2 InSlotParameter 1 0 OutSlotResult 0 3 InSlotImage 0 4 OutSlotImage 0 3 InSlotImage 1 0 OutSlotImage 2 4 InSlotImage 0 0 OutSlotImage 1 true 0 15 106 1 46 106 2 46 462 3 160 462 4 InSlotParameter 0 'BEGIN{col=ARGV[2];ARGC--}{if($col=="?")next}{print}' 4 InSlotParameter 1 18 OutSlotResult 0 6 InSlotImage 0 3 OutSlotImage 0 7 InSlotImage 0 3 OutSlotImage 1 7 InSlotParameter 0 'BEGIN{col=ARGV[2];ARGC--;target="#" (col-1)}NF==0{exit}$0 ~ target{go=1;next}/#/{if(go)exit}{if(go)print $1}' 7 InSlotParameter 1 18 OutSlotResult 0 9 InSlotImage 0 7 OutSlotImage 0 10 InSlotImage 0 9 OutSlotImage 0 11 InSlotImage 0 0 OutSlotImage 1 true 0 15 106 1 45 106 2 45 651 3 160 651 11 InSlotParameter 0 'BEGIN{col=ARGV[2];ARGC--}{if($col=="?")print $0 "," NR}' 11 InSlotParameter 1 18 OutSlotResult 0 12 InSlotImage 0 21 OutSlotImage 0 12 InSlotImage 1 0 OutSlotImage 2 14 InSlotImage 0 7 OutSlotImage 0 15 InSlotImage 0 14 OutSlotImage 0 16 InSlotImage 0 6 OutSlotImage 0 16 InSlotImage 1 12 OutSlotImage 0 true 0 359 625 1 648 625 2 648 484 3 676 484 16 InSlotImage 2 13 OutSlotImage 0 16 InSlotParameter 0 10 OutSlotResult 0 16 InSlotParameter 1 15 OutSlotResult 0 16 InSlotParameter 2 1 16 InSlotParameter 3 0 OutSlotResult 1 true 0 106 12 1 106 42 2 719 42 3 719 419 16 InSlotParameter 4 0 OutSlotResult 2 true 0 126 12 1 126 33 2 729 33 3 729 419 16 InSlotParameter 5 0 OutSlotResult 3 true 0 146 12 1 146 24 2 739 24 3 739 419 18 InSlotImage 0 2 OutSlotImage 0 true 0 113 86 1 136 86 2 136 191 3 150 191 19 InSlotImage 0 0 OutSlotImage 3 19 InSlotImage 1 23 OutSlotImage 0 true 0 941 288 1 1003 288 2 1003 488 3 1335 488 20 InSlotImage 0 16 OutSlotImage 0 20 InSlotImage 1 7 OutSlotImage 0 20 InSlotParameter 0 17 OutSlotResult 0 20 InSlotParameter 1 18 OutSlotResult 0 true 0 183 207 1 183 227 2 821 227 3 821 235 21 InSlotImage 0 11 OutSlotImage 0 21 InSlotParameter 0 's/,[0-9]*$//' 22 InSlotImage 0 11 OutSlotImage 0 22 InSlotParameter 0 '{print $NF}' 23 InSlotImage 0 22 OutSlotImage 0 true 0 267 718 1 889 718 2 889 277 3 901 277 23 InSlotImage 1 20 OutSlotImage 0 23 InSlotParameter 0 --delimiter=" " touch touch 6 177 271 shell 1 touch echo -n eval101 2 155 155 eval 1 1 0 InSlotImage 0 2 OutSlotImage 0 0 InSlotImage 0 2 OutSlotImage 0 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotParameter 0 echo -n sort system 7 164 131 sort -k1,1n $i > $o 1 1 sort system 8 436 249 sort $p $i > $o 1 1 1 awk system 9 544 249 awk $p $i > $o 1 1 1 mv remove system 10 486 44 awk -F, $p $i > $o 1 1 1 cat system 11 671 250 cat $i > $o 2 1 sort system 12 734 249 sort $p $i > $o 1 1 1 awk system 13 806 249 awk $p $i > $o 1 1 1 sortitem system 14 871 261 sortitem $i > $o 1 1 bin to csv system 15 932 249 sed $p $i > $o 1 1 1 0 InSlotImage 0 15 OutSlotImage 0 0 InSlotImage 0 15 OutSlotImage 0 0 InSlotParameter 0 5 OutSlotResult 0 0 InSlotParameter 0 5 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 true 0 15 86 1 49 86 2 49 269 3 57 269 2 InSlotImage 1 0 OutSlotImage 1 true 0 15 106 1 34 106 2 34 280 3 57 280 3 InSlotImage 0 0 OutSlotImage 0 3 InSlotParameter 0 '{for(i=1;i<=NF;i++)if($i=="?")mv[i]=1}END{for(i in mv)print i}' 4 InSlotImage 0 7 OutSlotImage 0 5 InSlotImage 0 7 OutSlotImage 0 5 InSlotImage 1 0 OutSlotImage 0 5 InSlotImage 2 2 OutSlotImage 0 5 InSlotImage 3 6 OutSlotImage 0 5 InSlotParameter 0 1 5 InSlotParameter 1 4 OutSlotResult 0 5 InSlotParameter 2 1 5 InSlotParameter 3 0 OutSlotResult 0 true 0 86 12 1 86 41 2 293 41 3 293 204 5 InSlotParameter 4 0 OutSlotResult 1 true 0 106 12 1 106 33 2 303 33 3 303 204 5 InSlotParameter 5 0 OutSlotResult 2 true 0 126 12 1 126 25 2 313 25 3 313 204 7 InSlotImage 0 3 OutSlotImage 0 8 InSlotImage 0 5 OutSlotImage 0 8 InSlotParameter 0 -k1,1n -k2,2n 9 InSlotImage 0 8 OutSlotImage 0 9 InSlotParameter 0 '{if($1!=last){last=$1;if(NR!=1)printf("\n");printf("%d ",$1)}}{printf("%s ",$NF)}END{printf("\n")}' 10 InSlotImage 0 0 OutSlotImage 0 10 InSlotParameter 0 '{printf("%d %d",NR,$1);for(i=2;i<=NF;i++){if($i!="?")printf(" %d",$i);}printf("\n");}' 11 InSlotImage 0 10 OutSlotImage 0 11 InSlotImage 1 9 OutSlotImage 0 12 InSlotImage 0 11 OutSlotImage 0 12 InSlotParameter 0 -k1,1n 13 InSlotImage 0 12 OutSlotImage 0 13 InSlotParameter 0 '{if($1!=last){last=$1;if(NR!=1)printf("\n");}}{for(i=2;i<=NF;i++)printf("%d ",$i)}END{printf("\n")}' 14 InSlotImage 0 13 OutSlotImage 0 15 InSlotImage 0 14 OutSlotImage 0 15 InSlotParameter 0 's/ /,/g;s/,$//' merge 3 427 131 2 1 mv detection system 4 104 44 awk -F, $p $i > $o 1 1 1 wc -l wc -l 5 238 46 shell 1 wc -l wc -l system 2 121 50 wc -l < $i > $o 1 1 setstatus setstatus 3 223 41 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 0 InSlotParameter 0 3 OutSlotResult 0 0 InSlotParameter 0 3 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 3 InSlotImage 0 2 OutSlotImage 0 if 6 240 119 $0 == 0 1 2 2 0 InSlotImage 0 3 OutSlotImage 0 0 InSlotImage 0 3 OutSlotImage 0 0 InSlotParameter 0 3 OutSlotResult 0 0 InSlotParameter 0 3 OutSlotResult 0 2 InSlotImage 0 6 OutSlotImage 1 2 InSlotImage 1 0 OutSlotImage 1 2 InSlotParameter 0 0 OutSlotResult 0 true 0 86 12 1 86 41 2 322 41 3 322 130 2 InSlotParameter 1 0 OutSlotResult 1 true 0 106 12 1 106 32 2 332 32 3 332 130 2 InSlotParameter 2 0 OutSlotResult 2 true 0 126 12 1 126 23 2 342 23 3 342 130 3 InSlotImage 0 6 OutSlotImage 0 3 InSlotImage 1 2 OutSlotImage 0 4 InSlotImage 0 0 OutSlotImage 0 4 InSlotParameter 0 '{for(i=1;i<=NF;i++)if($i=="?")mv[i]=1}END{for(i in mv)print i}' 5 InSlotImage 0 4 OutSlotImage 0 6 InSlotImage 0 0 OutSlotImage 0 true 0 15 86 1 67 86 2 67 161 3 239 161 6 InSlotParameter 0 5 OutSlotResult 0 6 InSlotParameter 1 0 surfer imputation macro-operator 16 340 294 2 2 1 surfer imputation macro-operator 2 348 125 2 2 1 note 2 126 53 encode the missing values with new items outputs also the col dictionary returns the max non-missing item mv encode macro-operator 3 189 160 1 2 filename 2 334 137 ./script/mv-code.awk false mv detection system 3 230 218 awk -F, $p $i > $o 1 1 1 sort system 4 313 261 sort -k1,1n $i > $o 1 1 mv-code system 5 375 207 awk -F, -f $p0 $i $p1 > $o 2 2 1 max item system 6 230 67 awk -F, $p $i > $o 1 1 1 setstatus setstatus 7 600 132 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 wc -l wc -l 8 625 251 shell 1 wc -l wc -l system 2 121 50 wc -l < $i > $o 1 1 setstatus setstatus 3 223 41 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 0 InSlotParameter 0 3 OutSlotResult 0 0 InSlotParameter 0 3 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 3 InSlotImage 0 2 OutSlotImage 0 shift system 9 611 326 awk $p > $o 3 1 0 InSlotImage 0 5 OutSlotImage 0 0 InSlotImage 1 9 OutSlotImage 0 0 InSlotImage 0 5 OutSlotImage 0 0 InSlotImage 1 9 OutSlotImage 0 0 InSlotParameter 0 7 OutSlotResult 0 0 InSlotParameter 0 7 OutSlotResult 0 3 InSlotImage 0 0 OutSlotImage 0 3 InSlotParameter 0 '{for(i=1;i<=NF;i++)if($i=="?")mv[i]=1}END{for(i in mv)print i}' 4 InSlotImage 0 3 OutSlotImage 0 5 InSlotImage 0 0 OutSlotImage 0 true 0 15 86 1 187 86 2 187 249 3 374 249 5 InSlotImage 1 4 OutSlotImage 0 5 InSlotParameter 0 2 OutSlotResult 0 5 InSlotParameter 1 7 OutSlotResult 0 6 InSlotImage 0 0 OutSlotImage 0 6 InSlotParameter 0 '{if($NF!="?" && $NF>max)max=$NF}END{print max}' 7 InSlotImage 0 6 OutSlotImage 0 8 InSlotImage 0 4 OutSlotImage 0 9 InSlotParameter 0 'BEGIN{for(i=ARGV[1]+1;i<=ARGV[1]+ARGV[2];i++)print i}' 9 InSlotParameter 1 7 OutSlotResult 0 9 InSlotParameter 2 8 OutSlotResult 0 for 4 410 147 3 5 1 sed system 2 206 295 sed 's/:.*//' $i > $o 1 1 mtsminer system 3 104 283 mtsminer $p 1000 $i > $o 1 3 1 extension system 4 303 295 extension $i > $o 2 1 awk system 5 135 64 awk $p0 $i $p1 > $o 1 2 1 setstatus setstatus 6 199 66 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 cat system 7 751 96 cat $i > $o 2 1 add target system 8 415 294 awk $p0 $i $p1 > $o 1 2 1 0 InSlotImage 0 7 OutSlotImage 0 0 InSlotImage 1 0 OutSlotImage 0 0 InSlotImage 2 0 OutSlotImage 1 0 InSlotImage 3 7 OutSlotImage 0 0 InSlotImage 0 7 OutSlotImage 0 0 InSlotImage 1 0 OutSlotImage 0 0 InSlotImage 2 0 OutSlotImage 1 0 InSlotImage 3 7 OutSlotImage 0 0 InSlotParameter 0 4 OutSlotResult 0 0 InSlotParameter 0 4 OutSlotResult 0 2 InSlotImage 0 3 OutSlotImage 0 3 InSlotImage 0 0 OutSlotImage 0 3 InSlotParameter 0 0 OutSlotResult 1 3 InSlotParameter 1 0 OutSlotResult 2 3 InSlotParameter 2 6 OutSlotResult 0 4 InSlotImage 0 2 OutSlotImage 0 4 InSlotImage 1 0 OutSlotImage 0 true 0 15 86 1 86 86 2 86 336 3 302 336 5 InSlotImage 0 0 OutSlotImage 1 5 InSlotParameter 0 'BEGIN{line=ARGV[2];ARGC--}NR==line{print;exit}' 5 InSlotParameter 1 0 OutSlotResult 0 6 InSlotImage 0 5 OutSlotImage 0 7 InSlotImage 0 0 OutSlotImage 2 7 InSlotImage 1 8 OutSlotImage 0 8 InSlotImage 0 4 OutSlotImage 0 8 InSlotParameter 0 'BEGIN{target=ARGV[2];ARGC--}{print target " : " $0}' 8 InSlotParameter 1 6 OutSlotResult 0 touch touch 5 294 183 shell 1 touch echo -n eval101 2 155 155 eval 1 1 0 InSlotImage 0 2 OutSlotImage 0 0 InSlotImage 0 2 OutSlotImage 0 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotParameter 0 echo -n wc -l wc -l 6 423 60 shell 1 wc -l wc -l system 2 121 50 wc -l < $i > $o 1 1 setstatus setstatus 3 223 41 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 0 InSlotParameter 0 3 OutSlotResult 0 0 InSlotParameter 0 3 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 3 InSlotImage 0 2 OutSlotImage 0 mapper system 7 510 181 awk $p $i > $o 1 1 1 sort system 8 556 193 sort -k1,1n $i > $o 1 1 header system 9 605 50 awk $p $i > $o 1 1 1 2 cols system 10 647 50 awk $p $i > $o 1 1 1 sortitem system 11 340 171 sortitem $i > $o 1 1 note 12 379 262 compute the explanations wc -l wc -l 13 703 51 shell 1 wc -l wc -l system 2 121 50 wc -l < $i > $o 1 1 setstatus setstatus 3 223 41 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 0 InSlotParameter 0 3 OutSlotResult 0 0 InSlotParameter 0 3 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 3 InSlotImage 0 2 OutSlotImage 0 for 14 699 158 3 3 1 iterate system 2 183 69 awk $p0 $i $p1 > $o 1 2 1 setstatus setstatus 3 268 71 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 part system 4 278 175 awk $p0 $i $p1 > $o 1 2 1 page rank system 5 388 187 pagerank $i > $o 1 1 for 6 466 269 2 3 1 impute system 2 214 123 awk $p0 $i $p1 > $o 1 2 1 awk system 3 93 29 awk $p0 $i $p1 > $o 1 2 1 setstatus setstatus 4 157 31 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 0 InSlotImage 0 2 OutSlotImage 0 0 InSlotImage 1 2 OutSlotImage 0 0 InSlotImage 2 0 OutSlotImage 1 0 InSlotImage 0 2 OutSlotImage 0 0 InSlotImage 1 2 OutSlotImage 0 0 InSlotImage 2 0 OutSlotImage 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 2 InSlotParameter 0 'BEGIN{line=ARGV[2];mv=ARGV[4];explanation=ARGV[6];ARGC=2}NR==line{for(i=1;i<=NF;i++)if($i==mv)printf("%d ",explanation);else printf("%d ",$i);printf("\n");next}{print}' 2 InSlotParameter 1 4 OutSlotResult 0 3 InSlotImage 0 0 OutSlotImage 1 3 InSlotParameter 0 'BEGIN{line=ARGV[2];ARGC--}NR==line{print;exit}' 3 InSlotParameter 1 0 OutSlotResult 0 4 InSlotImage 0 3 OutSlotImage 0 wc -l wc -l 7 470 177 shell 1 wc -l wc -l system 2 121 50 wc -l < $i > $o 1 1 setstatus setstatus 3 223 41 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 0 InSlotParameter 0 3 OutSlotResult 0 0 InSlotParameter 0 3 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 3 InSlotImage 0 2 OutSlotImage 0 note 8 447 121 impute the mv 0 InSlotImage 0 6 OutSlotImage 0 0 InSlotImage 1 0 OutSlotImage 0 0 InSlotImage 2 0 OutSlotImage 1 0 InSlotImage 3 6 OutSlotImage 0 0 InSlotImage 0 6 OutSlotImage 0 0 InSlotImage 1 0 OutSlotImage 0 0 InSlotImage 2 0 OutSlotImage 1 0 InSlotImage 3 6 OutSlotImage 0 0 InSlotParameter 0 6 OutSlotResult 0 0 InSlotParameter 0 6 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 2 InSlotParameter 0 'BEGIN{line=ARGV[2];ARGC--}NR==line{print;exit}' 2 InSlotParameter 1 0 OutSlotResult 0 3 InSlotImage 0 2 OutSlotImage 0 4 InSlotImage 0 0 OutSlotImage 1 4 InSlotParameter 0 'BEGIN{first=ARGV[2];last=ARGV[3];ARGC-=2}first<=NR && NR<last{print}' 4 InSlotParameter 1 3 OutSlotResult 0 5 InSlotImage 0 4 OutSlotImage 0 6 InSlotImage 0 0 OutSlotImage 2 6 InSlotImage 1 5 OutSlotImage 0 6 InSlotParameter 0 1 6 InSlotParameter 1 7 OutSlotResult 0 6 InSlotParameter 2 1 7 InSlotImage 0 5 OutSlotImage 0 note 15 698 273 iterate over the lines and replace mv with their explanations head -1 system 16 772 135 head -1 $i > $o 1 1 setstatus setstatus 17 834 125 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 rename system 18 844 192 awk $p0 $i $p1 > $o 1 2 1 note 19 883 276 renaming the mv to ? mvsegmentation system 20 978 204 mvsegmentation $i $o 2 2 bin to csv system 21 1076 203 sed $p $i > $o 1 1 1 dictionary system 22 913 204 dictionary $i > $o 2 1 0 InSlotImage 0 21 OutSlotImage 0 0 InSlotImage 0 21 OutSlotImage 0 0 InSlotParameter 0 4 OutSlotResult 0 0 InSlotParameter 0 4 OutSlotResult 0 3 InSlotImage 0 0 OutSlotImage 0 4 InSlotImage 0 11 OutSlotImage 0 4 InSlotImage 1 3 OutSlotImage 1 4 InSlotImage 2 5 OutSlotImage 0 4 InSlotParameter 0 1 4 InSlotParameter 1 6 OutSlotResult 0 4 InSlotParameter 2 1 4 InSlotParameter 3 0 OutSlotResult 0 true 0 86 12 1 86 44 2 452 44 3 452 147 4 InSlotParameter 4 0 OutSlotResult 1 true 0 106 12 1 106 26 2 462 26 3 462 147 6 InSlotImage 0 3 OutSlotImage 1 7 InSlotImage 0 4 OutSlotImage 0 7 InSlotParameter 0 'BEGIN{FS=" : "}{l=split($3,tab," ");for(i=1;i<=l;i++)print tab[i] " : " $1 " : " l " : " $2}' 8 InSlotImage 0 7 OutSlotImage 0 9 InSlotImage 0 8 OutSlotImage 0 9 InSlotParameter 0 '{if($1!=line){line=$1;print NR}}END{print NR+1}' 10 InSlotImage 0 9 OutSlotImage 0 10 InSlotParameter 0 'NR==1{first=$1}NR!=1{print first,$1;first=$1}' 11 InSlotImage 0 3 OutSlotImage 0 13 InSlotImage 0 10 OutSlotImage 0 14 InSlotImage 0 10 OutSlotImage 0 14 InSlotImage 1 8 OutSlotImage 0 true 0 587 223 1 641 223 2 641 223 3 698 223 14 InSlotImage 2 3 OutSlotImage 0 true 0 247 200 1 348 200 2 348 234 3 698 234 14 InSlotParameter 0 1 14 InSlotParameter 1 13 OutSlotResult 0 14 InSlotParameter 2 1 16 InSlotImage 0 3 OutSlotImage 1 true 0 247 211 1 276 211 2 276 165 3 771 165 17 InSlotImage 0 16 OutSlotImage 0 18 InSlotImage 0 14 OutSlotImage 0 18 InSlotParameter 0 'BEGIN{new=ARGV[2];ARGC--}{printf("%d",$1);for(i=2;i<=NF;i++)if($i>new)printf(",?");else printf(",%d",$i);printf("\n");}' 18 InSlotParameter 1 17 OutSlotResult 0 20 InSlotImage 0 18 OutSlotImage 0 20 InSlotImage 1 22 OutSlotImage 0 21 InSlotImage 0 20 OutSlotImage 0 21 InSlotParameter 0 's/ /,/g;s/,$//' 22 InSlotImage 0 18 OutSlotImage 0 22 InSlotImage 1 0 OutSlotImage 1 mv detection system 3 136 44 awk -F, $p $i > $o 1 1 1 wc -l wc -l 4 270 46 shell 1 wc -l wc -l system 2 121 50 wc -l < $i > $o 1 1 setstatus setstatus 3 223 41 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 0 InSlotParameter 0 3 OutSlotResult 0 0 InSlotParameter 0 3 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 3 InSlotImage 0 2 OutSlotImage 0 if 5 272 114 $0 == 0 1 2 2 merge 6 459 126 2 1 0 InSlotImage 0 6 OutSlotImage 0 0 InSlotImage 0 6 OutSlotImage 0 0 InSlotParameter 0 6 OutSlotResult 0 0 InSlotParameter 0 6 OutSlotResult 0 2 InSlotImage 0 5 OutSlotImage 1 2 InSlotImage 1 0 OutSlotImage 1 true 0 15 106 1 35 106 2 35 178 3 347 178 2 InSlotParameter 0 0 OutSlotResult 0 true 0 86 12 1 86 45 2 360 45 3 360 125 2 InSlotParameter 1 0 OutSlotResult 1 3 InSlotImage 0 0 OutSlotImage 0 3 InSlotParameter 0 '{for(i=1;i<=NF;i++)if($i=="?")mv[i]=1}END{for(i in mv)print i}' 4 InSlotImage 0 3 OutSlotImage 0 5 InSlotImage 0 0 OutSlotImage 0 5 InSlotParameter 0 4 OutSlotResult 0 5 InSlotParameter 1 0 6 InSlotImage 0 5 OutSlotImage 0 6 InSlotImage 1 2 OutSlotImage 0 mv-density mv-density 17 357 421 missing values 1 mv-density mv density system 2 65 44 awk -F, $p $i > $o 1 1 1 setstatus setstatus 3 150 46 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 0 InSlotParameter 0 3 OutSlotResult 0 0 InSlotParameter 0 3 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 2 InSlotParameter 0 '{total+=NF;for(i=1;i<=NF;i++)if($i=="?")mv++}END{print mv/total}' 3 InSlotImage 0 2 OutSlotImage 0 mv-density mv-density 18 492 419 missing values 1 mv-density mv density system 2 65 44 awk -F, $p $i > $o 1 1 1 setstatus setstatus 3 150 46 shell 1 setstatus setstatus.sh 2 159 101 shell 1 0 InSlotParameter 0 2 OutSlotResult 0 0 InSlotParameter 0 2 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 0 InSlotParameter 0 3 OutSlotResult 0 0 InSlotParameter 0 3 OutSlotResult 0 2 InSlotImage 0 0 OutSlotImage 0 2 InSlotParameter 0 '{total+=NF;for(i=1;i<=NF;i++)if($i=="?")mv++}END{print mv/total}' 3 InSlotImage 0 2 OutSlotImage 0 heart-nom-missing-surfer-imputation.csv saver 19 470 484 ./data/heart-nom-missing-surfer-imputation.csv 1 1 1 heart-nom-missing.csv saver 20 207 476 ./data/heart-nom-missing.csv 1 1 1 heart-nom-missing-rule-imputation.csv saver 21 469 550 ./data/heart-nom-missing-rule-imputation.csv 1 1 1 11 InSlotImage 0 12 OutSlotImage 0 11 InSlotParameter 0 2 11 InSlotParameter 1 7 OutSlotResult 0 12 InSlotImage 0 8 OutSlotImage 0 12 InSlotParameter 0 6 OutSlotResult 0 12 InSlotParameter 1 10 OutSlotResult 0 13 InSlotImage 0 8 OutSlotImage 0 13 InSlotImage 1 15 OutSlotImage 0 13 InSlotParameter 0 14 OutSlotResult 0 15 InSlotImage 0 11 OutSlotImage 0 15 InSlotImage 1 9 OutSlotImage 0 15 InSlotParameter 0 4 OutSlotResult 0 15 InSlotParameter 1 3 OutSlotResult 0 15 InSlotParameter 2 5 OutSlotResult 0 16 InSlotImage 0 11 OutSlotImage 0 16 InSlotImage 1 9 OutSlotImage 0 16 InSlotParameter 0 2 OutSlotResult 0 16 InSlotParameter 1 1 OutSlotResult 0 17 InSlotImage 0 16 OutSlotImage 0 18 InSlotImage 0 15 OutSlotImage 0 19 InSlotImage 0 15 OutSlotImage 0 19 InSlotParameter 0 20 InSlotImage 0 11 OutSlotImage 0 20 InSlotParameter 0 21 InSlotImage 0 15 OutSlotImage 0 21 InSlotParameter 0