Source code for forte.processors.misc.attribute_masking_processor

# Copyright 2019 The Forte Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#      http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from typing import Any, Dict

from forte.common.configuration import Config
from forte.common.resources import Resources
from forte.data.data_pack import DataPack
from forte.processors.base import PackProcessor

__all__ = ["AttributeMasker"]

from forte.utils import get_class


[docs]class AttributeMasker(PackProcessor): def __init__(self): super().__init__() self.fields: Dict = {} # pylint: disable=attribute-defined-outside-init
[docs] def initialize(self, resources: Resources, configs: Config): super().initialize(resources, configs) for entry_type, entry_attributes in self.configs.requests.items(): entry_class = get_class(entry_type) self.fields[entry_class] = entry_attributes
[docs] @classmethod def default_configs(cls) -> Dict[str, Any]: r"""Default config for this processor. Example usage is shown below .. code-block:: python { "requests": { "ft.onto.base_ontology.Token": ["pos"] } } Here: - `"requests"`: dict The entry types and fields required. The keys of the requests dict are the entry types whose fields need to be masked and the value is a list of field names. """ return {"requests": {}, "@no_typecheck": {"requests"}}
def _process(self, input_pack: DataPack): for entry_type, attributes in self.fields.items(): for entry in input_pack.get_entries_of(entry_type): for attribute in attributes: setattr(entry, attribute, None)