JyAbacusWCPlugIN.py
上传用户:quxuerui
上传日期:2018-01-08
资源大小:41811k
文件大小:1k
#
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements.  See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership.  The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License.  You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
# Java/Hadoop classes are imported through Jython's Java package bridge.
# The wildcard imports and their order are kept as-is: the class below relies
# on names they provide (ValueAggregatorBaseDescriptor, ArrayList), and the
# order decides which name wins if two packages export the same identifier.
from org.apache.hadoop.fs import Path
from org.apache.hadoop.io import *
from org.apache.hadoop.mapred import *
from org.apache.hadoop.abacus import *
from java.util import *
import sys
class AbacusWordCount(ValueAggregatorBaseDescriptor):
    """Value-aggregator descriptor that emits one count entry per word."""

    def generateKeyValPairs(self, key, val):
        """Build the aggregation entries for a single input record.

        The text of ``val`` (obtained via ``val.toString()``) is split with
        ``split()`` and one entry is generated per resulting token, using the
        ``LONG_VALUE_SUM`` aggregation type, the token as the id, and ``ONE``
        as the value.

        Parameters:
            key: Not used by this implementation.
            val: Object exposing ``toString()``; its text is tokenized.
                 Presumably a Hadoop ``Text`` record value -- confirm
                 against the calling framework.

        Returns:
            An ``ArrayList`` holding the entries in token order; it is empty
            when the text yields no tokens.
        """
        entries = ArrayList()
        for word in val.toString().split():
            entries.add(
                ValueAggregatorBaseDescriptor.generateEntry(
                    ValueAggregatorBaseDescriptor.LONG_VALUE_SUM,
                    word,
                    ValueAggregatorBaseDescriptor.ONE
                )
            )
        # Return after the loop so every token contributes an entry and an
        # empty record still yields an (empty) list rather than None.
        return entries