Grouping Data in a List/Hashmap

Question

I have a file like this:

Petal_Length    0   1.3 - 2.42
Petal_Length    1   2.42 - 3.54
Petal_Length    2   3.54 - 4.66
Petal_Length    3   4.66 - 5.78
Petal_Length    4   5.78 - 6.9
Petal_Width     5   0.3 - 0.76
Petal_Width     6   0.76 - 1.2200000000000002
Petal_Width     7   1.2200000000000002 - 1.6800000000000002
Petal_Width     8   1.6800000000000002 - 2.14
Petal_Width     9   2.14 - 2.6
Sepal_Length    10  4.3 - 5.02
Sepal_Length    11  5.02 - 5.739999999999999
Sepal_Length    12  5.739999999999999 - 6.459999999999999
Sepal_Length    13  6.459999999999999 - 7.179999999999999
Sepal_Length    14  7.179999999999999 - 7.899999999999999
Sepal_Width     15  2.3 - 2.76
Sepal_Width     16  2.76 - 3.2199999999999998
Sepal_Width     17  3.2199999999999998 - 3.6799999999999997
Sepal_Width     18  3.6799999999999997 - 4.14
Sepal_Width     19  4.14 - 4.6

I am trying to group this data by attribute name, like this:

Petal_Length[0:1.3 - 2.42,1:2.42 - 3.54,2:3.54 - 4.66,3:4.66 - 5.78,4:5.78 - 6.9]

Is this a reasonable way to group the data? My aim is to get the attribute name, the index, and the range.

Should I use a HashMap for this?

UPDATE

What I did is -

       // Read the input one line at a time until the reader is exhausted.
       while((line = bf.readLine())!=null){
        // Split the line on tab characters; per the sample file shown above this
        // presumably yields [name, index, range] -- confirm the file is tab-separated.
        String featureVal[] = line.split("	");
        val.add(featureVal[0]);
        // The set and the de-duplicated list are rebuilt from scratch on every line.
        // NOTE(review): HashSet does not guarantee iteration order, so positions in
        // attributeVal are not stable between iterations.
        listToSet = new HashSet(val);
        //Creating Arraylist without duplicate values
        attributeVal = new ArrayList(listToSet);
        //Extracting key
        // NOTE(review): this replaces the list stored under the key with a new empty
        // list on every line, discarding anything accumulated for that key so far.
        binMap.put(featureVal[0], new ArrayList());
        //Extracting Values
        // featureVal[1] is a single field from the tab split above, so it contains
        // no tab and cols has exactly one element (the second column).
        String[] cols = featureVal[1].split("	");
        for(int i = 0; i < cols.length; i++) {
            // Compares an attribute name (first column) against a second-column value.
            // NOTE(review): with the sample data these never match, so the body below
            // is skipped and every list in binMap stays empty.
            if(attributeVal.get(i).equals(cols[i])){
                System.out.println("in foorlop");
                List tmpList = binMap.get(attributeVal.get(i));
                if(tmpList == null) {
                    tmpList = new ArrayList();
                }
                System.out.println("cols[i]"+cols[i]);
                tmpList.add(cols[i]);
                //Get the list and add to that list instead of creating new temp list
                binMap.put(attributeVal.get(i), tmpList);
            }
        }
        // Prints the whole map after every input line.
        System.out.println("binMap: "+binMap);

    }

But the lists in my output are all empty:

binMap: {Petal_Width=[], Sepal_Length=[], Petal_Length=[], Sepal_Width=[]}

Please suggest.

Igor Katkov · Accepted Answer

Here is some sample code for you. Note how the domain classes Range and Attribute are used to make the string parsing convenient. All the grouping is done with a regular Java map.

import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;


public class PetalGrouping {
    private static final String input = "Petal_Length	0	1.3 - 2.42
"
        + "Petal_Length	1	2.42 - 3.54
"
        + "Petal_Length	2	3.54 - 4.66
"
        + "Petal_Length	3	4.66 - 5.78
"
        + "Petal_Length	4	5.78 - 6.9
"
        + "Petal_Width	 5	0.3 - 0.76
"
        + "Petal_Width	 6	0.76 - 1.2200000000000002
"
        + "Petal_Width	 7	1.2200000000000002 - 1.6800000000000002
"
        + "Petal_Width	 8	1.6800000000000002 - 2.14
"
        + "Petal_Width	 9	2.14 - 2.6
"
        + "Sepal_Length	10	4.3 - 5.02
"
        + "Sepal_Length	11	5.02 - 5.739999999999999
"
        + "Sepal_Length	12	5.739999999999999 - 6.459999999999999
"
        + "Sepal_Length	13	6.459999999999999 - 7.179999999999999
"
        + "Sepal_Length	14	7.179999999999999 - 7.899999999999999
"
        + "Sepal_Width	 15	2.3 - 2.76
"
        + "Sepal_Width	 16	2.76 - 3.2199999999999998
"
        + "Sepal_Width	 17	3.2199999999999998 - 3.6799999999999997
"
        + "Sepal_Width	 18	3.6799999999999997 - 4.14
"
        + "Sepal_Width	 19	4.14 - 4.6";

public static void main(String... args) {
    Map> map = new HashMap>();
    String[] lines = input.split("
");
    for (String line : lines) {
        Attribute attribute = Attribute.parse(line);
        List attributeList = map.get(attribute.getName());
        if (attributeList == null) {
            attributeList = new ArrayList();
            map.put(attribute.getName(), attributeList);
        }
        attributeList.add(attribute);
    }
    System.out.println(map);
}


}

/**
 * An immutable numeric interval parsed from text of the form {@code "from - to"}.
 */
class Range {
    private final double from;
    private final double to;

    private Range(double from, double to) {
        this.from = from;
        this.to = to;
    }

    /**
     * Parses a range written as two numbers separated by a standalone {@code -} token,
     * for example {@code "1.3 - 2.42"}. Leading/trailing whitespace and runs of
     * whitespace between the tokens are tolerated.
     *
     * @param string the text to parse
     * @return the parsed range
     * @throws IllegalArgumentException if the text does not consist of exactly three
     *         whitespace-separated tokens with {@code -} in the middle, or if either
     *         bound is not a valid double ({@link NumberFormatException})
     */
    public static Range parse(String string) {
        // Split on any run of whitespace so "1.3  -  2.42" parses the same as "1.3 - 2.42".
        String[] parts = string.trim().split("\\s+");
        if (parts.length != 3 || !"-".equals(parts[1])) {
            throw new IllegalArgumentException("Parsing failed for line: " + string);
        }
        return new Range(Double.parseDouble(parts[0]), Double.parseDouble(parts[2]));
    }

    @Override
    public String toString() {
        return "{from=" + from + ", to=" + to + '}';
    }
}

/**
 * One parsed input row: an attribute name, its bin index, and the bin's value range.
 */
class Attribute {
    private final String name;
    private final int index;
    private final Range range;

    protected Attribute(String name, int index, Range range) {
        this.name = name;
        this.index = index;
        this.range = range;
    }

    /**
     * Parses a row of the form {@code name<TAB>index<TAB>from - to}. Each column is
     * trimmed before use, so stray spaces around a column value are tolerated.
     *
     * @param line a single tab-separated row
     * @return the parsed attribute
     * @throws IllegalArgumentException if the row does not have exactly three
     *         tab-separated columns, or if the index is not a valid integer
     *         ({@link NumberFormatException})
     */
    public static Attribute parse(String line) {
        // The delimiter is written as an escape so it cannot be silently turned into
        // spaces by an editor or a copy/paste.
        String[] lineParts = line.split("\t");
        if (lineParts.length != 3) {
            throw new IllegalArgumentException("Parsing failed for line: " + line);
        }
        String name = lineParts[0].trim();
        int index = Integer.parseInt(lineParts[1].trim());
        Range range = Range.parse(lineParts[2].trim());
        return new Attribute(name, index, range);
    }

    /**
     * Returns the index and range in balanced braces. The name is omitted; callers
     * that group by name already have it as the map key.
     */
    @Override
    public String toString() {
        return "{index=" + index + ", range=" + range + '}';
    }

    /** Returns the attribute name (the first column of the row). */
    public String getName() {
        return name;
    }
}

Grouping Data in a List/Hashmap

Answers (2)

Related Questions