JyAbacusWCPlugIN.py 1.3 KB

123456789101112131415161718192021222324252627282930313233343536
  1. #
  2. # Licensed to the Apache Software Foundation (ASF) under one
  3. # or more contributor license agreements. See the NOTICE file
  4. # distributed with this work for additional information
  5. # regarding copyright ownership. The ASF licenses this file
  6. # to you under the Apache License, Version 2.0 (the
  7. # "License"); you may not use this file except in compliance
  8. # with the License. You may obtain a copy of the License at
  9. #
  10. # http://www.apache.org/licenses/LICENSE-2.0
  11. #
  12. # Unless required by applicable law or agreed to in writing, software
  13. # distributed under the License is distributed on an "AS IS" BASIS,
  14. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  15. # See the License for the specific language governing permissions and
  16. # limitations under the License.
  17. #
  18. from org.apache.hadoop.fs import Path
  19. from org.apache.hadoop.io import *
  20. from org.apache.hadoop.mapred import *
  21. from org.apache.hadoop.abacus import *;
  22. from java.util import *;
  23. import sys
  24. class AbacusWordCount(ValueAggregatorBaseDescriptor):
  25. def generateKeyValPairs(self, key, val):
  26. retv = ArrayList();
  27. for w in val.toString().split():
  28. en = ValueAggregatorBaseDescriptor.generateEntry(ValueAggregatorBaseDescriptor.LONG_VALUE_SUM, w, ValueAggregatorBaseDescriptor.ONE);
  29. retv.add(en);
  30. return retv;