Program Listing for File preprocess_fil.hpp
↰ Return to documentation for file (morpheus/_lib/include/morpheus/stages/preprocess_fil.hpp)
/*
* SPDX-FileCopyrightText: Copyright (c) 2021-2024, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: Apache-2.0
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#pragma once
#include "morpheus/export.h"
#include "morpheus/messages/control.hpp"
#include "morpheus/messages/multi.hpp"
#include "morpheus/messages/multi_inference.hpp"
#include "morpheus/objects/table_info.hpp"
#include <boost/fiber/context.hpp>
#include <mrc/segment/builder.hpp>
#include <mrc/segment/object.hpp>
#include <pymrc/node.hpp>
#include <rxcpp/rx.hpp>
#include <memory>
#include <string>
#include <thread>
#include <vector>
// IWYU pragma: no_include "rxcpp/sources/rx-iterate.hpp"
namespace morpheus {
/****** Component public implementations *******************/
/****** PreprocessFILStage**********************************/
/**
 * @brief Preprocessing stage for FIL inference, declared as an MRC Python node.
 *
 * The stage derives from `mrc::pymrc::PythonNode`, consuming `std::shared_ptr<InputT>` and emitting
 * `std::shared_ptr<OutputT>`. Only declarations live in this header; the member definitions are
 * provided elsewhere.
 *
 * @tparam InputT  Message type received by the stage (wrapped in `std::shared_ptr`).
 * @tparam OutputT Message type emitted by the stage (wrapped in `std::shared_ptr`).
 */
template <typename InputT, typename OutputT>
class MORPHEUS_EXPORT PreprocessFILStage
  : public mrc::pymrc::PythonNode<std::shared_ptr<InputT>, std::shared_ptr<OutputT>>
{
  public:
    using base_t = mrc::pymrc::PythonNode<std::shared_ptr<InputT>, std::shared_ptr<OutputT>>;
    using typename base_t::sink_type_t;
    using typename base_t::source_type_t;
    using typename base_t::subscribe_fn_t;

    /**
     * @brief Construct the stage from a list of feature names.
     *
     * Marked `explicit` so that a `std::vector<std::string>` is never silently converted into a stage.
     *
     * @param features Names of the features used by the stage.
     */
    explicit PreprocessFILStage(const std::vector<std::string>& features);

    /**
     * @brief Process one incoming message.
     *
     * @param x Incoming message (`sink_type_t` of the base node).
     * @return Outgoing message (`source_type_t` of the base node).
     */
    source_type_t on_data(sink_type_t x);

  private:
    /**
     * @brief Handler taking a `MultiMessage` and producing a `MultiInferenceMessage`.
     *
     * NOTE(review): presumably invoked from `on_data` when `InputT` is `MultiMessage`; confirm in the
     * implementation file.
     */
    std::shared_ptr<MultiInferenceMessage> on_multi_message(std::shared_ptr<MultiMessage> x);

    /**
     * @brief Handler taking a `ControlMessage` and producing a `ControlMessage`.
     *
     * NOTE(review): presumably invoked from `on_data` when `InputT` is `ControlMessage`; confirm in the
     * implementation file.
     */
    std::shared_ptr<ControlMessage> on_control_message(std::shared_ptr<ControlMessage> x);

    /**
     * @brief Helper operating on a list of feature columns and a mutable view of a table.
     *
     * Both arguments are taken by non-const reference, so either may be modified by the call.
     *
     * @param fea_cols     Feature column names.
     * @param mutable_info Mutable table accessor.
     */
    void transform_bad_columns(std::vector<std::string>& fea_cols, morpheus::MutableTableInfo& mutable_info);

    /**
     * @brief Helper that takes an incoming message and returns a `TableInfo`.
     *
     * NOTE(review): presumably applies `transform_bad_columns` to the message's table; confirm in the
     * implementation file.
     */
    TableInfo fix_bad_columns(sink_type_t x);

    // Feature column names. NOTE(review): presumably initialised from the constructor's `features`.
    std::vector<std::string> m_fea_cols;

    // NOTE(review): nothing else declared in this header refers to this member; confirm it is still needed.
    std::string m_vocab_file;
};
/** Alias for the stage instantiated with `MultiMessage` input and `MultiInferenceMessage` output. */
using PreprocessFILStageMM = // NOLINT(readability-identifier-naming)
PreprocessFILStage<MultiMessage, MultiInferenceMessage>;
/** Alias for the stage instantiated with `ControlMessage` as both input and output. */
using PreprocessFILStageCM = // NOLINT(readability-identifier-naming)
PreprocessFILStage<ControlMessage, ControlMessage>;
/****** PreprocessFILStageInterfaceProxy********************/
/**
 * @brief Collection of static factory declarations for the two `PreprocessFILStage` instantiations.
 *
 * NOTE(review): presumably these are the entry points exposed to the Python bindings; confirm against
 * the binding code.
 */
struct MORPHEUS_EXPORT PreprocessFILStageInterfaceProxy
{
/**
 * @brief Create a `PreprocessFILStage<MultiMessage, MultiInferenceMessage>` segment object.
 *
 * @param builder  Segment builder the call operates on.
 * @param name     Name for the stage.
 * @param features Feature names for the stage (presumably forwarded to its constructor).
 * @return Shared pointer to the segment object wrapping the stage.
 */
static std::shared_ptr<mrc::segment::Object<PreprocessFILStage<MultiMessage, MultiInferenceMessage>>> init_multi(
mrc::segment::Builder& builder, const std::string& name, const std::vector<std::string>& features);
/**
 * @brief Create a `PreprocessFILStage<ControlMessage, ControlMessage>` segment object.
 *
 * @param builder  Segment builder the call operates on.
 * @param name     Name for the stage.
 * @param features Feature names for the stage (presumably forwarded to its constructor).
 * @return Shared pointer to the segment object wrapping the stage.
 */
static std::shared_ptr<mrc::segment::Object<PreprocessFILStage<ControlMessage, ControlMessage>>> init_cm(
mrc::segment::Builder& builder, const std::string& name, const std::vector<std::string>& features);
}; // end of PreprocessFILStageInterfaceProxy
} // namespace morpheus