[ https://issues.apache.org/jira/browse/NIFI-1682?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=15805566#comment-15805566 ]
ASF GitHub Bot commented on NIFI-1682: -------------------------------------- Github user pvillard31 commented on a diff in the pull request: https://github.com/apache/nifi/pull/1328#discussion_r95008584 --- Diff: nifi-nar-bundles/nifi-stateful-analysis-bundle/nifi-stateful-analysis-processors/src/main/java/org/apache/nifi/processors/stateful/analysis/AttributeRollingWindow.java --- @@ -0,0 +1,325 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ +package org.apache.nifi.processors.stateful.analysis; + +import org.apache.nifi.annotation.behavior.InputRequirement; +import org.apache.nifi.annotation.behavior.Stateful; +import org.apache.nifi.annotation.behavior.TriggerSerially; +import org.apache.nifi.annotation.behavior.WritesAttribute; +import org.apache.nifi.annotation.behavior.WritesAttributes; +import org.apache.nifi.annotation.documentation.CapabilityDescription; +import org.apache.nifi.annotation.documentation.Tags; +import org.apache.nifi.annotation.lifecycle.OnScheduled; +import org.apache.nifi.components.PropertyDescriptor; +import org.apache.nifi.components.state.Scope; +import org.apache.nifi.components.state.StateManager; +import org.apache.nifi.components.state.StateMap; +import org.apache.nifi.flowfile.FlowFile; +import org.apache.nifi.processor.AbstractProcessor; +import org.apache.nifi.processor.ProcessContext; +import org.apache.nifi.processor.ProcessSession; +import org.apache.nifi.processor.Relationship; +import org.apache.nifi.processor.exception.ProcessException; +import org.apache.nifi.processor.util.StandardValidators; + +import java.io.IOException; +import java.util.ArrayList; +import java.util.Collections; +import java.util.HashMap; +import java.util.HashSet; +import java.util.List; +import java.util.Map; +import java.util.Set; +import java.util.concurrent.TimeUnit; + +import static org.apache.nifi.processors.stateful.analysis.AttributeRollingWindow.ROLLING_WINDOW_COUNT_KEY; +import static org.apache.nifi.processors.stateful.analysis.AttributeRollingWindow.ROLLING_WINDOW_VALUE_KEY; + +@TriggerSerially +@InputRequirement(InputRequirement.Requirement.INPUT_REQUIRED) +@Tags({"Attribute Expression Language", "state", "data science", "rolling", "window"}) +@CapabilityDescription("Track a Rolling Window based on evaluating an Expression Language expression on each FlowFile and add that value to the processor's state. 
Each FlowFile will be emitted " + + "with the count of FlowFiles and total aggregate value of values processed in the current time window.") +@WritesAttributes({ + @WritesAttribute(attribute = ROLLING_WINDOW_VALUE_KEY, description = "The rolling window value (sum of all the values stored)."), + @WritesAttribute(attribute = ROLLING_WINDOW_COUNT_KEY, description = "The count of the number of FlowFiles seen in the rolling window.") +}) +@Stateful(scopes = {Scope.LOCAL}, description = "Store the values backing the rolling window. This includes storing the individual values and their time-stamps or the batches of values and their " + + "counts.") +public class AttributeRollingWindow extends AbstractProcessor { + + public static final String COUNT_KEY = "count"; + public static final String ROLLING_WINDOW_VALUE_KEY = "rolling_window_value"; + public static final String ROLLING_WINDOW_COUNT_KEY = "rolling_window_count"; + + public static final String CURRENT_MICRO_BATCH_STATE_TS_KEY = "start_curr_batch_ts"; + public static final String BATCH_APPEND_KEY = "_batch"; + public static final String COUNT_APPEND_KEY = "_count"; + public static final int COUNT_APPEND_KEY_LENGTH = 6; + + static final PropertyDescriptor VALUE_TO_TRACK = new PropertyDescriptor.Builder() + .name("Value to track") --- End diff -- Use .displayName() in addition to .name()? > Processor to do Rolling Window calculations using FlowFile attributes > --------------------------------------------------------------------- > > Key: NIFI-1682 > URL: https://issues.apache.org/jira/browse/NIFI-1682 > Project: Apache NiFi > Issue Type: New Feature > Reporter: Joseph Percivall > Assignee: Joseph Percivall > > Using state, it is now possible to store a map of key/value pairs up to 1 MB. > Taking into account storing a timestamp string and a double converted to a > string, this is on the order of 5000 values. This enables a processor that can > store a rolling window of values to calculate things such as a rolling mean. 
-- This message was sent by Atlassian JIRA (v6.3.4#6332)