summaryrefslogtreecommitdiffstats
path: root/examples/svm-countdistinct.awk
blob: 7362f398ae42427383ba9f54f833efa6dcb44638 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
# MAXUNIQUE caps how many distinct values are remembered per feature.
# It defaults to 100 but can be overridden from the command line, e.g.
#   gawk -v MAXUNIQUE=1000 -f svm-countdistinct.awk data.svm
# -v assignments are applied before BEGIN runs, so only fall back to the
# default when no usable (positive) value was supplied.
BEGIN {
    if (MAXUNIQUE + 0 < 1)
        MAXUNIQUE = 100
    else
        MAXUNIQUE = int(MAXUNIQUE)   # the cap is compared against an integer count
}
# For every input record, split each field from the second one onward at its
# first ":" into a feature name and a value, and remember the value in
# values[feature] (a gawk array of arrays). Field 1 is never inspected
# (presumably the label of an SVM-light/libsvm style line -- confirm).
1 {
    for (i = 2; i <= NF; i++) {
        s = index($i, ":")
        # No separator: not a feature:value pair, so do not file the whole
        # token under an empty feature name.
        if (s == 0)
            continue
        feature = substr($i, 1, s - 1)
        # Stop collecting once a feature has reached the cap; ">=" keeps the
        # bound effective even if the cap is not hit exactly.
        if (feature in values && length(values[feature]) >= MAXUNIQUE)
            continue
        value = substr($i, s + 1)
        values[feature][value] = 1
    }
}
# After all input is consumed, emit one line per feature seen: the feature
# name followed by how many distinct values were recorded for it.
# Iteration order of "for (... in ...)" is unspecified in awk.
END {
    for (name in values) {
        distinct = length(values[name])
        print name, distinct
    }
}