天天看点

java8-08-自定义Collector-groupBy

  • 声明
  • 简单实现
  • 简化代码
  • 使用自定义Collector
  • 博客源码

声明

这一系列文章旨在帮助大家理解 `Collector` 的执行流程,至于实现得是否高效、是否优雅、是否合理等暂且不论。

现在来实现一个和 `java.util.stream.Collectors#groupingBy()` 一样效果的 `GroupByCollector`。

当然此处的实现肯定没有jdk那样灵活,效率就先不提了,至少贫道的这个实现不支持多级分组V_V。

若对 `Collector` 的各个流程有疑问,请移驾此处:http://blog.csdn.net/hylexus/article/details/78941843

简单实现

// A Characteristics set lifted from the JDK 8 source.
// It contains only IDENTITY_FINISH, i.e. the finisher is the identity function.
static final Set<Collector.Characteristics> CH_ID
        = Collections.unmodifiableSet(EnumSet.of(Collector.Characteristics.IDENTITY_FINISH));
           
/**
 * A minimal {@link Collector} that groups stream elements into a
 * {@code Map<K, List<T>>}, keyed by the value a classifier function returns
 * for each element.
 *
 * <p>This is the deliberately explicit ("simple") variant: every step is
 * spelled out with plain null checks. The accumulation container is also the
 * result, so the finisher is the identity function and the collector reports
 * only {@code IDENTITY_FINISH}. There is no downstream collector, so
 * multi-level grouping is not supported.
 *
 * @param <T> type of the stream elements
 * @param <K> type of the grouping key
 */
static class GroupByCollector<T, K> implements Collector<T, Map<K, List<T>>, Map<K, List<T>>> {

    /** Maps an element to the key of the group it belongs to. */
    final Function<T, K> classifier;

    /**
     * @param classifier function that computes the grouping key of an element
     */
    public GroupByCollector(Function<T, K> classifier) {
        this.classifier = classifier;
    }

    /** Creates the empty result container. */
    @Override
    public Supplier<Map<K, List<T>>> supplier() {
        return () -> new HashMap<>();
    }

    /** Appends one element to the list of its group, creating the list on first use. */
    @Override
    public BiConsumer<Map<K, List<T>>, T> accumulator() {
        return (map, e) -> {
            K key = classifier.apply(e);
            // Look the group up once and reuse the reference instead of
            // querying the map again for the null check and for the add.
            List<T> group = map.get(key);
            if (group == null) {
                group = Lists.newArrayList();
                map.put(key, group);
            }
            group.add(e);
        };
    }

    /** Merges the groups of {@code map2} into {@code map1} and returns {@code map1}. */
    @Override
    public BinaryOperator<Map<K, List<T>>> combiner() {
        return (map1, map2) -> {
            map2.forEach((k, v) -> {
                List<T> existing = map1.get(k);
                if (existing == null) {
                    // Key only present on the right-hand side: adopt its list as-is.
                    map1.put(k, v);
                } else {
                    existing.addAll(v);
                }
            });
            return map1;
        };
    }

    /** The accumulation container already is the result, so nothing is transformed. */
    @Override
    public Function<Map<K, List<T>>, Map<K, List<T>>> finisher() {
        return Function.identity();
    }

    /** Reports {@code IDENTITY_FINISH} only. */
    @Override
    public Set<Characteristics> characteristics() {
        return CH_ID;
    }
}
           

简化代码

/**
 * The condensed variant of the grouping collector: groups stream elements
 * into a {@code Map<K, List<T>>} keyed by the value a classifier function
 * returns for each element.
 *
 * <p>Group lists are created lazily with {@link Map#computeIfAbsent}, so no
 * list is allocated for an element whose group already exists. The
 * accumulation container is also the result, so the finisher is the identity
 * function and the collector reports only {@code IDENTITY_FINISH}.
 *
 * @param <T> type of the stream elements
 * @param <K> type of the grouping key
 */
static class GroupByCollector2<T, K> implements Collector<T, Map<K, List<T>>, Map<K, List<T>>> {

    /** Maps an element to the key of the group it belongs to. */
    final Function<T, K> classifier;

    /**
     * @param classifier function that computes the grouping key of an element
     */
    public GroupByCollector2(Function<T, K> classifier) {
        this.classifier = classifier;
    }

    /** Creates the empty result container. */
    @Override
    public Supplier<Map<K, List<T>>> supplier() {
        return HashMap::new;
    }

    /** Appends one element to the list of its group, creating the list on first use. */
    @Override
    public BiConsumer<Map<K, List<T>>, T> accumulator() {
        return (map, e) ->
                map.computeIfAbsent(classifier.apply(e), key -> Lists.newArrayList()).add(e);
    }

    /**
     * Merges the groups of {@code m2} into {@code m1} and returns {@code m1}.
     * Elements are copied into lists owned by {@code m1}; the lists of
     * {@code m2} are never adopted.
     */
    @Override
    public BinaryOperator<Map<K, List<T>>> combiner() {
        return (m1, m2) -> {
            m2.forEach((k, v) -> m1.computeIfAbsent(k, key -> Lists.newArrayList()).addAll(v));
            return m1;
        };
    }

    /** The accumulation container already is the result, so nothing is transformed. */
    @Override
    public Function<Map<K, List<T>>, Map<K, List<T>>> finisher() {
        return Function.identity();
    }

    /** Reports {@code IDENTITY_FINISH} only. */
    @Override
    public Set<Characteristics> characteristics() {
        return CH_ID;
    }
}
           

使用自定义Collector

/**
 * Sample bean used to demonstrate grouping.
 *
 * <p>The accessors and {@code toString()} that the original listing elided
 * are written out here: the demo test calls {@code User::getGender}, and the
 * sample output prints users as
 * {@code User{id=.., name='..', gender=.., age=..}}.
 */
static class User {
    private Integer id;
    private String name;
    private Integer gender;
    private Integer age;

    User(Integer id, String name, Integer gender, Integer age) {
        this.id = id;
        this.name = name;
        this.gender = gender;
        this.age = age;
    }

    public Integer getId() {
        return id;
    }

    public void setId(Integer id) {
        this.id = id;
    }

    public String getName() {
        return name;
    }

    public void setName(String name) {
        this.name = name;
    }

    /** Returns the value the demo groups by. */
    public Integer getGender() {
        return gender;
    }

    public void setGender(Integer gender) {
        this.gender = gender;
    }

    public Integer getAge() {
        return age;
    }

    public void setAge(Integer age) {
        this.age = age;
    }

    /** Renders the user in the format shown in the article's sample output. */
    @Override
    public String toString() {
        return "User{id=" + id + ", name='" + name + "', gender=" + gender + ", age=" + age + "}";
    }
}

List<User> users = Lists.newArrayList(
        new User(, "java", , ),
        new User(, "C", , ),
        new User(, "scala", , ),
        new User(, "C++", , ),
        new User(, "Spark", , ),
        new User(, "PHP", , ),
        new User(, "Python", , ),
        new User(, "JavaScript", , ),
        new User(, "C#", , )
);

/**
 * Writes a grouping result to standard output: each key on its own line,
 * followed by the users of that group, one per line and prefixed with a tab.
 *
 * @param map grouping result to print
 */
void printUserMap(Map<Integer, List<User>> map) {
    for (Map.Entry<Integer, List<User>> group : map.entrySet()) {
        System.out.println(group.getKey());
        for (User member : group.getValue()) {
            System.out.println("\t" + member);
        }
    }
}

/**
 * Groups {@code users} by gender three times: with the JDK's
 * {@code Collectors.groupingBy}, with {@code GroupByCollector} and with
 * {@code GroupByCollector2}. Each result is printed, and the test fails if a
 * custom collector produces a map that differs from the JDK result.
 */
@Test
public void test2() {
    Map<Integer, List<User>> expected = users.stream()
            .collect(Collectors.groupingBy(User::getGender));
    printUserMap(expected);

    Map<Integer, List<User>> map = users.stream()
            .collect(new GroupByCollector<>(User::getGender));
    printUserMap(map);
    // Printing alone proves nothing; make a mismatch fail the test.
    if (!expected.equals(map)) {
        throw new AssertionError("GroupByCollector differs from Collectors.groupingBy: " + map);
    }

    map = users.stream()
            .collect(new GroupByCollector2<>(User::getGender));
    printUserMap(map);
    if (!expected.equals(map)) {
        throw new AssertionError("GroupByCollector2 differs from Collectors.groupingBy: " + map);
    }
}
           
  • 输出效果
0
    User{id=3, name='scala', gender=0, age=27}
    User{id=4, name='C++', gender=0, age=28}
    User{id=6, name='PHP', gender=0, age=30}
    User{id=8, name='JavaScript', gender=0, age=32}
1
    User{id=1, name='java', gender=1, age=25}
    User{id=2, name='C', gender=1, age=26}
    User{id=5, name='Spark', gender=1, age=29}
    User{id=7, name='Python', gender=1, age=31}
    User{id=9, name='C#', gender=1, age=33}
           

博客源码

https://github.com/hylexus/blog-src/blob/master/java-core/src/test/java/cn/hylexus/lambda/CollectorTest.java