Program Listing for File preprocess_fil.hpp#

Return to documentation for file (python/morpheus/morpheus/_lib/include/morpheus/stages/preprocess_fil.hpp)

/*
 * SPDX-FileCopyrightText: Copyright (c) 2022-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 * SPDX-License-Identifier: Apache-2.0
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#pragma once

#include "morpheus/export.h"                // for MORPHEUS_EXPORT
#include "morpheus/messages/control.hpp"    // for ControlMessage
#include "morpheus/objects/table_info.hpp"  // for TableInfo

#include <boost/fiber/context.hpp>  // for operator<<
#include <mrc/segment/builder.hpp>  // for Builder
#include <mrc/segment/object.hpp>   // for Object
#include <pymrc/node.hpp>           // for PythonNode
#include <rxcpp/rx.hpp>             // for trace_activity, decay_t, from

#include <memory>  // for shared_ptr
#include <string>  // for string
#include <thread>  // for operator<<
#include <vector>  // for vector

// IWYU pragma: no_include "rxcpp/sources/rx-iterate.hpp"

namespace morpheus {

/****** Component public implementations *******************/
/****** PreprocessFILStage**********************************/

class MORPHEUS_EXPORT PreprocessFILStage
  : public mrc::pymrc::PythonNode<std::shared_ptr<ControlMessage>, std::shared_ptr<ControlMessage>>
{
  public:
    using base_t = mrc::pymrc::PythonNode<std::shared_ptr<ControlMessage>, std::shared_ptr<ControlMessage>>;
    using typename base_t::sink_type_t;
    using typename base_t::source_type_t;
    using typename base_t::subscribe_fn_t;

    PreprocessFILStage(const std::vector<std::string>& features);

    source_type_t on_data(sink_type_t x);

  private:
    TableInfo fix_bad_columns(sink_type_t x);

    std::vector<std::string> m_fea_cols;
    std::string m_vocab_file;
};

/****** PreprocessFILStageInferenceProxy********************/
struct MORPHEUS_EXPORT PreprocessFILStageInterfaceProxy
{
    static std::shared_ptr<mrc::segment::Object<PreprocessFILStage>> init(mrc::segment::Builder& builder,
                                                                          const std::string& name,
                                                                          const std::vector<std::string>& features);
};  // end of group
}  // namespace morpheus