Skip to content

Text Tags

nyckel.TextTagsFunction

Example:

from nyckel import Credentials, TextTagsFunction, TextTagsSample, TagsAnnotation

credentials = Credentials(client_id="...", client_secret="...")

func = TextTagsFunction.create("NewsTopics", credentials)
func.create_samples([
    TextTagsSample(data="This is the best restaurant in NYC.", annotation=[TagsAnnotation("Food"), TagsAnnotation("Reviews")]),
    TextTagsSample(data="The Belly-Up tavern in Solana Beach...", annotation=[TagsAnnotation("Music"), TagsAnnotation("Reviews")]),
    TextTagsSample(data="Here is how to make the best Pasta Carbonara.", annotation=[TagsAnnotation("Food")]),
    TextTagsSample(data="Taylor swift just released a new album, again.", annotation=[TagsAnnotation("Music")]),
])

predictions = func.invoke(["Swedish meatballs: the best recipes"])
Source code in src/nyckel/functions/tags/text_tags.py
class TextTagsFunction:
    """
    Example:

    ```py

    from nyckel import Credentials, TextTagsFunction, TextTagsSample, TagsAnnotation

    credentials = Credentials(client_id="...", client_secret="...")

    func = TextTagsFunction.create("NewsTopics", credentials)
    func.create_samples([
        TextTagsSample(data="This is the best restaurant in NYC.", annotation=[TagsAnnotation("Food"), TagsAnnotation("Reviews")]),
        TextTagsSample(data="The Belly-Up tavern in Solana Beach...", annotation=[TagsAnnotation("Music"), TagsAnnotation("Reviews")]),
        TextTagsSample(data="Here is how to make the best Pasta Carbonara.", annotation=[TagsAnnotation("Food")]),
        TextTagsSample(data="Taylor swift just released a new album, again.", annotation=[TagsAnnotation("Music")]),
    ])

    predictions = func.invoke(["Swedish meatballs: the best recipes"])
    ```
    """

    def __init__(self, function_id: NyckelId, credentials: Credentials):
        self._function_id = function_id

        self._function_handler = TagsFunctionHandler(function_id, credentials)
        self._label_handler = ClassificationLabelHandler(function_id, credentials)
        self._url_handler = TagsFunctionURLHandler(function_id, credentials.server_url)
        self._sample_handler = TagsSampleHandler(function_id, credentials)

        assert self._function_handler.get_input_modality() == "Text"

    def __str__(self) -> str:
        return self.__repr__()

    def __repr__(self) -> str:
        status_string = f"Name: {self.name}, id: {self.function_id}, url: {self._url_handler.train_page}"
        return status_string

    @property
    def function_id(self) -> str:
        return self._function_id

    @property
    def sample_count(self) -> int:
        return self._function_handler.sample_count

    @property
    def label_count(self) -> int:
        return self._function_handler.label_count

    @property
    def name(self) -> str:
        return self._function_handler.get_name()

    @classmethod
    def create(cls, name: str, credentials: Credentials) -> "TextTagsFunction":
        return tags_function_factory.TagsFunctionFactory().create(name, "Text", credentials)  # type:ignore

    def delete(self) -> None:
        self._function_handler.delete()

    def invoke(self, sample_data_list: List[str]) -> List[TagsPrediction]:
        """Invokes the trained function. Raises ValueError if function is not trained"""
        return self._sample_handler.invoke(sample_data_list, lambda x: x)  # type: ignore

    def has_trained_model(self) -> bool:
        return self._function_handler.is_trained

    def create_labels(self, labels: Sequence[Union[ClassificationLabel, str]]) -> List[NyckelId]:  # type:ignore
        typed_labels = [
            label if isinstance(label, ClassificationLabel) else ClassificationLabel(name=label)  # type:ignore
            for label in labels
        ]
        return self._label_handler.create_labels(typed_labels)

    def list_labels(self) -> List[ClassificationLabel]:
        return self._label_handler.list_labels(self.label_count)

    def read_label(self, label_id: NyckelId) -> ClassificationLabel:
        return self._label_handler.read_label(label_id)

    def update_label(self, label: ClassificationLabel) -> ClassificationLabel:
        return self._label_handler.update_label(label)

    def delete_labels(self, label_ids: List[NyckelId]) -> None:
        return self._label_handler.delete_labels(label_ids)

    def create_samples(self, samples: Sequence[Union[TextTagsSample, TextSampleData]]) -> List[NyckelId]:  # type:ignore
        typed_samples = self._wrangle_post_samples_input(samples)
        typed_samples = self._strip_label_names(typed_samples)
        self._create_labels_as_needed(typed_samples)

        return self._sample_handler.create_samples(typed_samples, lambda x: x)

    def _wrangle_post_samples_input(
        self, samples: Sequence[Union[TextTagsSample, TextSampleData]]
    ) -> List[TextTagsSample]:
        typed_samples: List[TextTagsSample] = []
        for sample in samples:
            if isinstance(sample, str):
                typed_samples.append(TextTagsSample(data=sample))
            elif isinstance(sample, TextTagsSample):
                typed_samples.append(sample)
            else:
                raise ValueError(f"Unknown sample type: {type(sample)}")
        return typed_samples

    def _strip_label_names(self, samples: List[TextTagsSample]) -> List[TextTagsSample]:
        for sample in samples:
            if sample.annotation:
                for entry in sample.annotation:
                    entry.label_name = entry.label_name.strip()
        return samples

    def _create_labels_as_needed(self, samples: List[TextTagsSample]) -> None:
        existing_labels = self._label_handler.list_labels(None)
        existing_label_names = {label.name for label in existing_labels}
        new_label_names: set = set()
        for sample in samples:
            if sample.annotation:
                new_label_names |= {annotation.label_name for annotation in sample.annotation}
        missing_label_names = new_label_names - existing_label_names
        missing_labels = [ClassificationLabel(name=label_name) for label_name in missing_label_names]
        if len(missing_labels) > 0:
            self._label_handler.create_labels(missing_labels)

    def list_samples(self) -> List[TextTagsSample]:
        samples_dict_list = self._sample_handler.list_samples(self.sample_count)
        labels = self._label_handler.list_labels(None)
        label_name_by_id = {label.id: label.name for label in labels}

        return [self._sample_from_dict(entry, label_name_by_id) for entry in samples_dict_list]  # type: ignore

    def _sample_from_dict(self, sample_dict: Dict, label_name_by_id: Dict[NyckelId, str]) -> TextTagsSample:
        if "annotation" in sample_dict:
            annotation = [
                TagsAnnotation(
                    label_name=label_name_by_id[strip_nyckel_prefix(entry["labelId"])],
                    present=entry["present"],
                )
                for entry in sample_dict["annotation"]
            ]
        else:
            annotation = None

        if "prediction" in sample_dict:
            prediction = [
                ClassificationPrediction(
                    confidence=entry["confidence"],
                    label_name=label_name_by_id[strip_nyckel_prefix(entry["labelId"])],
                )
                for entry in sample_dict["prediction"]
            ]
        else:
            prediction = None

        return TextTagsSample(
            id=strip_nyckel_prefix(sample_dict["id"]),
            data=sample_dict["data"],
            external_id=sample_dict["externalId"] if "externalId" in sample_dict else None,
            annotation=annotation,
            prediction=prediction,
        )

    def read_sample(self, sample_id: NyckelId) -> TextTagsSample:
        sample_dict = self._sample_handler.read_sample(sample_id)

        labels = self._label_handler.list_labels(None)
        label_name_by_id = {strip_nyckel_prefix(label.id): label.name for label in labels}  # type: ignore

        return self._sample_from_dict(sample_dict, label_name_by_id)  # type: ignore

    def update_annotation(self, sample: TextTagsSample) -> None:
        self._sample_handler.update_annotation(sample)

    def delete_samples(self, sample_ids: List[NyckelId]) -> None:
        self._sample_handler.delete_samples(sample_ids)

function_id property

function_id: str

sample_count property

sample_count: int

label_count property

label_count: int

name property

name: str

__init__

__init__(function_id: NyckelId, credentials: Credentials)
Source code in src/nyckel/functions/tags/text_tags.py
def __init__(self, function_id: NyckelId, credentials: Credentials):
    self._function_id = function_id

    self._function_handler = TagsFunctionHandler(function_id, credentials)
    self._label_handler = ClassificationLabelHandler(function_id, credentials)
    self._url_handler = TagsFunctionURLHandler(function_id, credentials.server_url)
    self._sample_handler = TagsSampleHandler(function_id, credentials)

    assert self._function_handler.get_input_modality() == "Text"

create classmethod

create(name: str, credentials: Credentials) -> TextTagsFunction
Source code in src/nyckel/functions/tags/text_tags.py
@classmethod
def create(cls, name: str, credentials: Credentials) -> "TextTagsFunction":
    return tags_function_factory.TagsFunctionFactory().create(name, "Text", credentials)  # type:ignore

delete

delete() -> None
Source code in src/nyckel/functions/tags/text_tags.py
def delete(self) -> None:
    self._function_handler.delete()

invoke

invoke(sample_data_list: List[str]) -> List[TagsPrediction]

Invokes the trained function. Raises ValueError if function is not trained

Source code in src/nyckel/functions/tags/text_tags.py
def invoke(self, sample_data_list: List[str]) -> List[TagsPrediction]:
    """Invokes the trained function. Raises ValueError if function is not trained"""
    return self._sample_handler.invoke(sample_data_list, lambda x: x)  # type: ignore

has_trained_model

has_trained_model() -> bool
Source code in src/nyckel/functions/tags/text_tags.py
def has_trained_model(self) -> bool:
    return self._function_handler.is_trained

create_labels

create_labels(labels: Sequence[Union[ClassificationLabel, str]]) -> List[NyckelId]
Source code in src/nyckel/functions/tags/text_tags.py
def create_labels(self, labels: Sequence[Union[ClassificationLabel, str]]) -> List[NyckelId]:  # type:ignore
    typed_labels = [
        label if isinstance(label, ClassificationLabel) else ClassificationLabel(name=label)  # type:ignore
        for label in labels
    ]
    return self._label_handler.create_labels(typed_labels)

list_labels

list_labels() -> List[ClassificationLabel]
Source code in src/nyckel/functions/tags/text_tags.py
def list_labels(self) -> List[ClassificationLabel]:
    return self._label_handler.list_labels(self.label_count)

read_label

read_label(label_id: NyckelId) -> ClassificationLabel
Source code in src/nyckel/functions/tags/text_tags.py
def read_label(self, label_id: NyckelId) -> ClassificationLabel:
    return self._label_handler.read_label(label_id)

update_label

update_label(label: ClassificationLabel) -> ClassificationLabel
Source code in src/nyckel/functions/tags/text_tags.py
def update_label(self, label: ClassificationLabel) -> ClassificationLabel:
    return self._label_handler.update_label(label)

delete_labels

delete_labels(label_ids: List[NyckelId]) -> None
Source code in src/nyckel/functions/tags/text_tags.py
def delete_labels(self, label_ids: List[NyckelId]) -> None:
    return self._label_handler.delete_labels(label_ids)

create_samples

create_samples(samples: Sequence[Union[TextTagsSample, TextSampleData]]) -> List[NyckelId]
Source code in src/nyckel/functions/tags/text_tags.py
def create_samples(self, samples: Sequence[Union[TextTagsSample, TextSampleData]]) -> List[NyckelId]:  # type:ignore
    typed_samples = self._wrangle_post_samples_input(samples)
    typed_samples = self._strip_label_names(typed_samples)
    self._create_labels_as_needed(typed_samples)

    return self._sample_handler.create_samples(typed_samples, lambda x: x)

list_samples

list_samples() -> List[TextTagsSample]
Source code in src/nyckel/functions/tags/text_tags.py
def list_samples(self) -> List[TextTagsSample]:
    samples_dict_list = self._sample_handler.list_samples(self.sample_count)
    labels = self._label_handler.list_labels(None)
    label_name_by_id = {label.id: label.name for label in labels}

    return [self._sample_from_dict(entry, label_name_by_id) for entry in samples_dict_list]  # type: ignore

read_sample

read_sample(sample_id: NyckelId) -> TextTagsSample
Source code in src/nyckel/functions/tags/text_tags.py
def read_sample(self, sample_id: NyckelId) -> TextTagsSample:
    sample_dict = self._sample_handler.read_sample(sample_id)

    labels = self._label_handler.list_labels(None)
    label_name_by_id = {strip_nyckel_prefix(label.id): label.name for label in labels}  # type: ignore

    return self._sample_from_dict(sample_dict, label_name_by_id)  # type: ignore

update_annotation

update_annotation(sample: TextTagsSample) -> None
Source code in src/nyckel/functions/tags/text_tags.py
def update_annotation(self, sample: TextTagsSample) -> None:
    self._sample_handler.update_annotation(sample)

delete_samples

delete_samples(sample_ids: List[NyckelId]) -> None
Source code in src/nyckel/functions/tags/text_tags.py
def delete_samples(self, sample_ids: List[NyckelId]) -> None:
    self._sample_handler.delete_samples(sample_ids)

nyckel.TextTagsSample dataclass

Source code in src/nyckel/functions/tags/tags.py
@dataclass
class TextTagsSample:
    data: TextSampleData
    id: Optional[NyckelId] = None
    external_id: Optional[str] = None
    annotation: Optional[List[TagsAnnotation]] = None
    prediction: Optional[List[ClassificationPrediction]] = None

data instance-attribute

id class-attribute instance-attribute

id: Optional[NyckelId] = None

external_id class-attribute instance-attribute

external_id: Optional[str] = None

annotation class-attribute instance-attribute

annotation: Optional[List[TagsAnnotation]] = None

prediction class-attribute instance-attribute

prediction: Optional[List[ClassificationPrediction]] = None

__init__

__init__(data: TextSampleData, id: Optional[NyckelId] = None, external_id: Optional[str] = None, annotation: Optional[List[TagsAnnotation]] = None, prediction: Optional[List[ClassificationPrediction]] = None) -> None

nyckel.TextSampleData module-attribute

TextSampleData = str