Services¶

`backchannel` `special` ¶

`PytorchAcousticBackchanneler` ¶

`PytorchAcousticBackchanneler (Module)` ¶

Class for defining the Deep Backchannel model in PyTorch

Source code in adviser/services/backchannel/PytorchAcousticBackchanneler.py

class PytorchAcousticBackchanneler(nn.Module):
    """Class for defining the Deep Backchannel model in PyTorch"""

    def __init__(self, parameters:list=[], load_params:bool=False):
        """
        Defines the elements/layers of the neural network as well as loads the pretrained parameters

        The model is constituted by two parallel CNNs followed by a concatenation, a FFN and a softmax layer.

        Args:
            parameters (list): list of pre-trained parameters to be used for prediction.
                Entry ``i`` is read as ``parameters[i][0]`` (weights) and ``parameters[i][1]``
                (bias) for, in order: first CNN, second CNN, hidden linear layer, output layer.
                The default list is only read, never modified.
            load_params (bool): Bool to signal if params should be loaded
        """
        super(PytorchAcousticBackchanneler, self).__init__()

        # First CNN
        cnn = nn.Conv2d(in_channels=1, out_channels=16, kernel_size=(11, 13), stride=(3, 1))
        if load_params:
            self._load_conv_params(cnn, parameters[0])
        self.cnn1 = nn.Sequential(
            cnn,
            nn.ReLU(),
            nn.MaxPool2d((23, 1))
        )

        # Second CNN
        cnn = nn.Conv2d(in_channels=1, out_channels=16, kernel_size=(12, 13), stride=(3, 1))
        if load_params:
            self._load_conv_params(cnn, parameters[1])
        self.cnn2 = nn.Sequential(
            cnn,
            nn.ReLU(),
            nn.MaxPool2d((23, 1))
        )

        # Linear layer
        self.linear1 = nn.Linear(in_features=64, out_features=100)
        if load_params:
            self._load_linear_params(self.linear1, parameters[2])
        self.relu = nn.ReLU()
        self.dropout = nn.Dropout(0.5)

        # Softmax
        self.linear2 = nn.Linear(in_features=100, out_features=3)
        if load_params:
            self._load_linear_params(self.linear2, parameters[3])
        self.softmax = nn.Softmax(dim=1)

    @staticmethod
    def _load_conv_params(layer, params):
        """Overwrite weight and bias of a Conv2d layer with the pretrained pair ``params``."""
        # The (3, 2, 0, 1) permutation moves the last source axis to the front, which yields
        # the (out_channels, in_channels, height, width) layout Conv2d stores its weights in.
        weights = np.transpose(params[0], (3, 2, 0, 1))
        layer.weight = torch.nn.Parameter(torch.tensor(weights).float())
        layer.bias = torch.nn.Parameter(torch.tensor(params[1]).float())

    @staticmethod
    def _load_linear_params(layer, params):
        """Overwrite weight and bias of a Linear layer with the pretrained pair ``params``."""
        # The stored matrix is transposed before use: nn.Linear keeps (out_features, in_features).
        layer.weight = torch.nn.Parameter(torch.tensor(params[0].T).float())
        layer.bias = torch.nn.Parameter(torch.tensor(params[1]).float())

    def forward(self, feat_inputs):
        """
        PyTorch forward method used for training and prediction. It defines the interaction between layers.

        Args:
            feat_inputs (numpy array, sequence of numpy arrays, or torch.Tensor): the network's input.
                A channel axis is inserted at position 1 before the convolutions.

        Returns:
            out (torch.tensor): Network's output (softmax over dimension 1)
        """
        if not torch.is_tensor(feat_inputs):
            # Stack through numpy first: calling torch.tensor() directly on a list of arrays
            # converts element by element, which is slow and triggers a warning.
            feat_inputs = torch.as_tensor(np.asarray(feat_inputs))
        feat_inputs = feat_inputs.float()
        feat_inputs = feat_inputs.unsqueeze(1)
        cnn_1 = self.cnn1(feat_inputs).flatten(1)
        cnn_2 = self.cnn2(feat_inputs).flatten(1)
        out = torch.cat((cnn_1, cnn_2), 1)
        out = self.linear1(out)
        out = self.relu(out)
        out = self.dropout(out)
        out = self.linear2(out)
        out = self.softmax(out)
        return out

`init(self, parameters=[], load_params=False)` `special` ¶

Defines the elements/layers of the neural network as well as loads the pretrained parameters

The model is constituted by two parallel CNNs followed by a concatenation, a FFN and a softmax layer.

Parameters:

Name	Type	Description	Default
`parameters`	`list`	list of pre-trained parameters to be used for prediction	`[]`
`load_params`	`bool`	Bool to signal if params should be loaded	`False`

Source code in adviser/services/backchannel/PytorchAcousticBackchanneler.py

def __init__(self, parameters:list=[], load_params:bool=False):
    """
    Build the layers of the backchannel network and optionally load pretrained values.

    Two convolutional branches (each: convolution, ReLU, max pooling) are followed by a
    100-unit linear layer with ReLU and dropout and a 3-unit linear layer with softmax.

    Args:
        parameters (list): pretrained values; entry ``i`` is read as ``parameters[i][0]``
            (weights) and ``parameters[i][1]`` (bias) for the first CNN, the second CNN,
            the hidden linear layer and the output layer, in that order
        load_params (bool): when True the layer weights/biases are replaced by ``parameters``
    """
    super(PytorchAcousticBackchanneler, self).__init__()

    def as_parameter(values):
        # wrap raw values as a float32 trainable parameter
        return torch.nn.Parameter(torch.tensor(values).float())

    # permutation that brings stored kernels into Conv2d's (out, in, height, width) layout
    kernel_axes = (3, 2, 0, 1)

    # --- first convolutional branch ---
    first_conv = nn.Conv2d(in_channels=1, out_channels=16, kernel_size=(11, 13), stride=(3, 1))
    if load_params:
        first_conv.weight = as_parameter(np.transpose(parameters[0][0], kernel_axes))
        first_conv.bias = as_parameter(parameters[0][1])
    self.cnn1 = nn.Sequential(first_conv, nn.ReLU(), nn.MaxPool2d((23, 1)))

    # --- second convolutional branch ---
    second_conv = nn.Conv2d(in_channels=1, out_channels=16, kernel_size=(12, 13), stride=(3, 1))
    if load_params:
        second_conv.weight = as_parameter(np.transpose(parameters[1][0], kernel_axes))
        second_conv.bias = as_parameter(parameters[1][1])
    self.cnn2 = nn.Sequential(second_conv, nn.ReLU(), nn.MaxPool2d((23, 1)))

    # --- hidden feed-forward layer ---
    self.linear1 = nn.Linear(in_features=64, out_features=100)
    if load_params:
        # stored matrices are transposed to nn.Linear's (out_features, in_features)
        self.linear1.weight = as_parameter(parameters[2][0].T)
        self.linear1.bias = as_parameter(parameters[2][1])
    self.relu = nn.ReLU()
    self.dropout = nn.Dropout(0.5)

    # --- output layer and softmax ---
    self.linear2 = nn.Linear(in_features=100, out_features=3)
    if load_params:
        self.linear2.weight = as_parameter(parameters[3][0].T)
        self.linear2.bias = as_parameter(parameters[3][1])
    self.softmax = nn.Softmax(dim=1)

`forward(self, feat_inputs)` ¶

PyTorch forward method used for training and prediction. It defines the interaction between layers.

Parameters:

Name	Type	Description	Default
`feat_inputs`	`numpy array`	It contains the network's input.	required

Returns:

Type	Description
`out (torch.tensor)`	Network's output

Source code in adviser/services/backchannel/PytorchAcousticBackchanneler.py

def forward(self, feat_inputs):
    """
    PyTorch forward method used for training and prediction. It defines the interaction between layers.

    Args:
        feat_inputs (numpy array, sequence of numpy arrays, or torch.Tensor): the network's input.
            A channel axis is inserted at position 1 before the convolutions.

    Returns:
        out (torch.tensor): Network's output (softmax over dimension 1)
    """
    if not torch.is_tensor(feat_inputs):
        # Stack through numpy first: calling torch.tensor() directly on a list of arrays
        # converts element by element, which is slow and triggers a warning.
        feat_inputs = torch.as_tensor(np.asarray(feat_inputs))
    feat_inputs = feat_inputs.float()
    feat_inputs = feat_inputs.unsqueeze(1)
    # both CNN branches see the same input; their flattened outputs are concatenated
    cnn_1 = self.cnn1(feat_inputs).flatten(1)
    cnn_2 = self.cnn2(feat_inputs).flatten(1)
    out = torch.cat((cnn_1, cnn_2), 1)
    out = self.linear1(out)
    out = self.relu(out)
    out = self.dropout(out)
    out = self.linear2(out)
    out = self.softmax(out)
    return out

`acoustic_backchanneller` ¶

`gpu` ¶

`AcousticBackchanneller (Service)` ¶

AcousticBackchanneller predicts a backchannel given the last user utterance. The model can predict: No backchannel (0), Assessment (1), Continuer (2). The backchannel realization is added in the NLG module.

Source code in adviser/services/backchannel/acoustic_backchanneller.py

class AcousticBackchanneller(Service):
    """AcousticBackchanneller predicts a backchannel given the last user utterance.
       The model can predict: No backchannel (0), Assessment (1), Continuer (2).
       The backchannel realization is added in the NLG module.
    """

    def __init__(self):
        """Initialise the service, set the file locations and load the pretrained model."""
        Service.__init__(self)
        self.speech_in_dir = os.path.dirname(os.path.abspath(__file__)) + '/'
        # NOTE: relative path, it is not anchored to speech_in_dir
        self.trained_model_path = os.path.join('resources', 'models', 'backchannel') + '/pytorch_acoustic_backchanneller.pt'
        self.load_model()

    def load_model(self):
        """
        The PyTorch Backchannel model is instantiated and the pretrained parameters are loaded.

        The checkpoint is mapped to the CPU: backchannel_prediction converts the model output
        with ``.numpy()``, which only works for CPU tensors, and a checkpoint saved from a GPU
        could otherwise not be loaded on a machine without CUDA.
        """
        self.model = PytorchAcousticBackchanneler()
        state_dict = torch.load(self.trained_model_path, map_location=torch.device('cpu'))
        self.model.load_state_dict(state_dict)
        self.model.eval()

    def split_input_data(self, mfcc_features):
        """
        Preprocess and segmentation of MFCC features of the user's speech.
        Segmentation is done every 150ms without overlapping.

        Segment boundaries are counted backwards from index ``len - 1``; a leading segment
        shorter than 150 frames is left-padded with zeros. Inputs with fewer than two frames
        produce no segment.

        Args:
            mfcc_features (numpy.array): MFCC features of the user's speech (2-dimensional)

        Returns:
            new_data (list): segmented mfcc features
        """
        input_height = 150  # this stands for 150ms
        input_length = mfcc_features.shape[0]
        zero_shape = list(mfcc_features.shape)
        zero_shape[0] = input_height
        # exclusive end index of every segment, in ascending order
        ranges = sorted(range(input_length - 1, 0, -input_height))
        new_data = []
        for r in ranges:
            if r < input_height:
                # not enough frames for a full window: right-align them in a zero block
                zero_data = np.zeros(zero_shape)
                zero_data[-r:, :] = mfcc_features[:r, :]
                new_data.append(zero_data)
            else:
                new_data.append(mfcc_features[r - input_height:r, :])
        return new_data

    @PublishSubscribe(sub_topics=['mfcc'],
                      pub_topics=["predicted_BC"])
    def backchannel_prediction(self, mfcc: np.array):
        """
        Service that receives the MFCC features from the user's speech.
        It preprocess and normalize them and makes the BC prediction.

        Args:
            mfcc: MFCC features; ``.numpy()`` is called on it, so a tensor-like object
                is expected despite the annotation

        Returns:
            (dict): a dictionary with the key "predicted_BC" and the value of the BC type
                    as a plain int (0: no backchannel, 1: assessment, 2: continuer)
        """
        # class_int_mapping = {0: b'no_bc', 1: b'assessment', 2: b'continuer'}
        mfcc_features = mfcc.numpy()
        scaler = preprocessing.StandardScaler()
        mfcc_features = scaler.fit_transform(mfcc_features)
        input_splits = self.split_input_data(mfcc_features)
        if not input_splits:
            # too few frames to build a single segment: nothing to classify
            return {'predicted_BC': 0}
        # stack the segments into one array so the model receives a single batch
        prediction = self.model(np.stack(input_splits)).detach().numpy().argmax(axis=1)

        # Returning the majority, unless a BC appears:
        # any predicted backchannel wins over "no backchannel"; between the two
        # backchannel types the more frequent one is chosen (ties go to 2).
        ones = int((prediction == 1).sum())
        twos = int((prediction == 2).sum())
        if ones == 0 and twos == 0:
            return {'predicted_BC': 0}
        return {'predicted_BC': 1 if ones > twos else 2}

`init(self)` `special` ¶

Source code in adviser/services/backchannel/acoustic_backchanneller.py

def __init__(self):
    """Initialise the service, set the file locations and load the pretrained model."""
    Service.__init__(self)
    # directory that contains this source file, with a trailing '/'
    self.speech_in_dir = os.path.dirname(os.path.abspath(__file__)) + '/'
    # NOTE(review): relative path, not anchored to speech_in_dir - presumably resolved
    # against the current working directory when the checkpoint is opened; confirm
    self.trained_model_path = os.path.join('resources', 'models', 'backchannel') + '/pytorch_acoustic_backchanneller.pt'
    self.load_model()

`backchannel_prediction(self, *args, **kwargs)` ¶

Source code in adviser/services/backchannel/acoustic_backchanneller.py

def delegate(self, *args, **kwargs):
    """
    Call the wrapped function and publish the entries of its result dictionary.

    `func`, `pub_topics` and `_send_msg` are not defined in this block; they come from the
    enclosing scope (presumably the decorator that creates this wrapper - confirm there).

    Args:
        *args: positional arguments forwarded to `func`; `self` is dropped if it is among them
        **kwargs: keyword arguments forwarded to `func`

    Returns:
        The result of `func`. A non-empty result is re-keyed so that every key is cut at
        its first "/".
    """
    func_inst = getattr(self, func.__name__)

    callargs = list(args)
    if self in callargs:    # remove self when in *args, because already known to function
        callargs.remove(self)
    result = func(self, *callargs, **kwargs)
    if result:
        # fix! (user could have multiple "/" characters in topic - only use last one )
        # maps the part before the first "/" to the part between the first and second "/"
        domains = {res.split("/")[0]: res.split("/")[1] if "/" in res else "" for res in result}
        result = {key.split("/")[0]: result[key] for key in result}

    if func_inst not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[func_inst]
    domain = self._domain_name
    if socket and result:
        # publish messages
        for topic in pub_topics:
        # for topic in result: # NOTE publish any returned value in dict with it's key as topic
            if topic in result:
                # NOTE(review): `domain` is reassigned here and kept for the following
                # iterations, so a domain taken from one result key is reused for later
                # topics when self._domain_name is empty - confirm this is intended
                domain = domain if domain else domains[topic]
                topic_domain_str = f"{topic}/{domain}" if domain else topic
                # an entry in self._pub_topic_domains overrides the domain chosen above
                if topic in self._pub_topic_domains:
                    topic_domain_str = f"{topic}/{self._pub_topic_domains[topic]}" if self._pub_topic_domains[topic] else topic
                _send_msg(socket, topic_domain_str, result[topic])
                if self.debug_logger:
                    self.debug_logger.info(
                        f"- (DS): sent message from {func} to topic {topic_domain_str}:\n   {result[topic]}")
    return result

`load_model(self)` ¶

The PyTorch Backchannel model is instantiated and the pretrained parameters are loaded.

Source code in adviser/services/backchannel/acoustic_backchanneller.py

def load_model(self):
    """
    The PyTorch Backchannel model is instantiated and the pretrained parameters are loaded.

    The checkpoint at ``self.trained_model_path`` is mapped to the CPU: the service converts
    the model output with ``.numpy()``, which only works for CPU tensors, and a checkpoint
    saved from a GPU could otherwise not be loaded on a machine without CUDA.

    Returns:
        None; the model is stored in ``self.model`` and switched to evaluation mode.
    """
    self.model = PytorchAcousticBackchanneler()
    state_dict = torch.load(self.trained_model_path, map_location=torch.device('cpu'))
    self.model.load_state_dict(state_dict)
    self.model.eval()

`split_input_data(self, mfcc_features)` ¶

Preprocess and segmentation of MFCC features of the user's speech. Segmentation is done every 150ms without overlapping.

Parameters:

Name	Type	Description	Default
`mfcc_features`	`numpy.array`	MFCC features of the user's speech	required

Returns:

Type	Description
`new_data (list)`	segmented mfcc features

Source code in adviser/services/backchannel/acoustic_backchanneller.py

def split_input_data(self, mfcc_features):
    """
    Cut the MFCC features of the user's speech into consecutive, non-overlapping
    windows of 150 frames (the original comment equates this with 150ms).

    Window boundaries are counted backwards from index ``len - 1``. A leading window
    with fewer than 150 frames is right-aligned inside a zero-filled block.

    Args:
        mfcc_features (numpy.array): MFCC features of the user's speech (2-dimensional)

    Returns:
        list: the windows in chronological order; empty if there are fewer than two frames
    """
    window = 150
    n_frames = mfcc_features.shape[0]
    padded_shape = [window, *mfcc_features.shape[1:]]

    segments = []
    # exclusive end index of each window, ascending
    for end in sorted(range(n_frames - 1, 0, -window)):
        if end >= window:
            segments.append(mfcc_features[end - window:end, :])
            continue
        # partial first window: zeros in front, available frames at the end
        padded = np.zeros(padded_shape)
        padded[-end:, :] = mfcc_features[:end, :]
        segments.append(padded)
    return segments

`bst` `special` ¶

`bst` ¶

`HandcraftedBST (Service)` ¶

A rule-based approach to belief state tracking.

Source code in adviser/services/bst/bst.py

class HandcraftedBST(Service):
    """
    Belief state tracker that follows hand-written rules.
    """

    def __init__(self, domain=None, logger=None):
        """
        Args:
            domain: forwarded to Service.__init__ and to the BeliefState constructor
            logger: stored as self.logger
        """
        Service.__init__(self, domain=domain)
        self.logger = logger
        self.bs = BeliefState(domain)

    @PublishSubscribe(sub_topics=["user_acts"], pub_topics=["beliefstate"])
    def update_bst(self, user_acts: List[UserAct] = None) \
            -> dict(beliefstate=BeliefState):
        """
            Starts a new turn in the belief state and, if there are user acts, folds
            them into it and refreshes the database match statistics.

            Args:
                user_acts (list): a list of UserAct objects mapped from the user's last utterance

            Returns:
                (dict): a dictionary with the key "beliefstate" and the value the updated
                        BeliefState object
        """
        # save last turn to memory
        self.bs.start_new_turn()
        if not user_acts:
            # nothing was said: only the turn change is recorded
            return {'beliefstate': self.bs}

        self._reset_informs(user_acts)
        self._reset_requests()
        self.bs["user_acts"] = self._get_all_usr_action_types(user_acts)

        self._handle_user_acts(user_acts)

        match_count, can_discriminate = self.bs.get_num_dbmatches()
        self.bs["num_matches"] = match_count
        self.bs["discriminable"] = can_discriminate
        return {'beliefstate': self.bs}

    def dialog_start(self):
        """
            Replaces the belief state with a fresh one so the tracker is ready for a
            new dialog. Nothing is returned.
        """
        self.bs = BeliefState(self.domain)

    def _reset_informs(self, acts: List[UserAct]):
        """
            Drops every informed slot from the belief state for which the user
            gives a new value in this turn.
        """
        informed_now = {act.slot for act in acts if act.type == UserActionType.Inform}
        # collect first, delete afterwards: the mapping must not change while iterating
        outdated = [slot for slot in self.bs['informs'] if slot in informed_now]
        for slot in outdated:
            del self.bs['informs'][slot]

    def _reset_requests(self):
        """
            Clears the requests remembered from the previous turn.
        """
        self.bs['requests'] = {}

    def _get_all_usr_action_types(self, user_acts: List[UserAct]) -> Set[UserActionType]:
        """
        Collects the distinct action types occurring in user_acts.

        Args:
            user_acts (List[UserAct]): list of UserAct objects

        Returns:
            set of UserActionType objects
        """
        return {act.type for act in user_acts}

    def _handle_user_acts(self, user_acts: List[UserAct]):
        """
            Applies the user act(s) to the belief state.

            Args:
                user_acts (list[UserAct]): the list of user acts to use to update the belief state
        """
        turn_act_types = self.bs["user_acts"]

        if self.domain.get_primary_key() in self.bs['informs'] \
                and UserActionType.Inform in turn_act_types:
            # new information from the user invalidates the current offer
            del self.bs['informs'][self.domain.get_primary_key()]
        elif UserActionType.SelectDomain in turn_act_types:
            # switching domains is treated as starting over; resuming an old
            # dialog is not supported
            self.bs["informs"] = {}
            self.bs["requests"] = {}

        for act in user_acts:
            kind = act.type
            if kind == UserActionType.Request:
                self.bs['requests'][act.slot] = act.score
            elif kind == UserActionType.Inform:
                # store the informed value together with its score
                if act.slot not in self.bs["informs"]:
                    self.bs['informs'][act.slot] = {act.value: act.score}
                else:
                    self.bs['informs'][act.slot][act.value] = act.score
            elif kind == UserActionType.NegativeInform:
                # forget the rejected value if it is currently tracked
                if act.slot in self.bs['informs'] and act.value in self.bs['informs'][act.slot]:
                    del self.bs['informs'][act.slot][act.value]
            elif kind == UserActionType.RequestAlternatives:
                # the user no longer asks about the item offered so far
                if self.domain.get_primary_key() in self.bs['informs']:
                    del self.bs['informs'][self.domain.get_primary_key()]

`init(self, domain=None, logger=None)` `special` ¶

Source code in adviser/services/bst/bst.py

def __init__(self, domain=None, logger=None):
    """
    Set up the tracker with an initial belief state.

    Args:
        domain: forwarded to Service.__init__ and to the BeliefState constructor
        logger: stored as self.logger
    """
    Service.__init__(self, domain=domain)
    self.logger = logger
    self.bs = BeliefState(domain)

`dialog_start(self)` ¶

Resets the belief state so it is ready for a new dialog

Returns:

Type	Description
`(dict)`	a dictionary with a single entry where the key is 'beliefstate'and the value is a new BeliefState object

Source code in adviser/services/bst/bst.py

def dialog_start(self):
    """
        Resets the belief state so it is ready for a new dialog.

        self.bs is replaced by a new BeliefState built from self.domain.
        Nothing is returned.
    """
    # initialize belief state
    self.bs = BeliefState(self.domain)

`update_bst(self, *args, **kwargs)` ¶

Source code in adviser/services/bst/bst.py

def delegate(self, *args, **kwargs):
    """
    Call the wrapped function and publish the entries of its result dictionary.

    `func`, `pub_topics` and `_send_msg` are not defined in this block; they come from the
    enclosing scope (presumably the decorator that creates this wrapper - confirm there).

    Args:
        *args: positional arguments forwarded to `func`; `self` is dropped if it is among them
        **kwargs: keyword arguments forwarded to `func`

    Returns:
        The result of `func`. A non-empty result is re-keyed so that every key is cut at
        its first "/".
    """
    func_inst = getattr(self, func.__name__)

    callargs = list(args)
    if self in callargs:    # remove self when in *args, because already known to function
        callargs.remove(self)
    result = func(self, *callargs, **kwargs)
    if result:
        # fix! (user could have multiple "/" characters in topic - only use last one )
        # maps the part before the first "/" to the part between the first and second "/"
        domains = {res.split("/")[0]: res.split("/")[1] if "/" in res else "" for res in result}
        result = {key.split("/")[0]: result[key] for key in result}

    if func_inst not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[func_inst]
    domain = self._domain_name
    if socket and result:
        # publish messages
        for topic in pub_topics:
        # for topic in result: # NOTE publish any returned value in dict with it's key as topic
            if topic in result:
                # NOTE(review): `domain` is reassigned here and kept for the following
                # iterations, so a domain taken from one result key is reused for later
                # topics when self._domain_name is empty - confirm this is intended
                domain = domain if domain else domains[topic]
                topic_domain_str = f"{topic}/{domain}" if domain else topic
                # an entry in self._pub_topic_domains overrides the domain chosen above
                if topic in self._pub_topic_domains:
                    topic_domain_str = f"{topic}/{self._pub_topic_domains[topic]}" if self._pub_topic_domains[topic] else topic
                _send_msg(socket, topic_domain_str, result[topic])
                if self.debug_logger:
                    self.debug_logger.info(
                        f"- (DS): sent message from {func} to topic {topic_domain_str}:\n   {result[topic]}")
    return result

`domain_tracker` `special` ¶

`domain_tracker` ¶

The console module provides ADVISER services for tracking current domain

`DomainTracker (Service)` ¶

Responsible for selecting which domain should be active at a given time. Current implementation uses keywords to switch domains.

Source code in adviser/services/domain_tracker/domain_tracker.py

class DomainTracker(Service):
    """
        Responsible for selecting which domain should be active at a given time.
        Current implementation uses keywords to switch domains.
    """

    def __init__(self, domains: List[Domain], greet_on_first_turn: bool = False):
        """
            Args:
                domains (List[Domain]): the domains the system can switch between
                greet_on_first_turn (bool): if True, the first call to select_domain of a
                                            dialog answers with a greeting instead of routing
        """
        Service.__init__(self, domain="")
        self.domains = domains
        self.current_domain = None
        self.greet_on_first_turn = greet_on_first_turn
        # initialised here as well, so select_domain also works before dialog_start ran
        self.turn = 0

    def dialog_start(self):
        """
            Resets the domain tracker for the start of a new dialog
        """
        self.turn = 0
        self.current_domain = None

    def _domain_prompt(self) -> str:
        """Builds the message that greets the user and lists the available domains."""
        return "Hello, please let me know how I can help you, I can discuss " + \
               f"the following domains: {self.domains_to_str()}."

    @PublishSubscribe(sub_topics=["gen_user_utterance"], pub_topics=["user_utterance", "sys_utterance"])
    def select_domain(self, gen_user_utterance: str = None) -> dict(user_utterance=str):
        """
            Determines which domain should currently be active. In general, if a keyword is mentioned, the domain
            will change, otherwise it is assumed that the previous domain is still active.

            Args:
                gen_user_utterance (str): the user utterance, before a domain has been determined;
                                          None is treated like an empty utterance

            Returns:
                (dict): A dictionary with "user_utterance/<domain name>" as a key and the lowercased,
                        stripped utterance as the value, so the message can be properly routed;
                        or a dictionary with the key "sys_utterance" when the system answers itself
                        (greeting, goodbye, or asking for a domain).
        """

        self.turn += 1
        if self.turn == 1 and self.greet_on_first_turn:
            return {'sys_utterance': self._domain_prompt()}

        # if there is only a single domain, simply route the message forward
        if len(self.domains) == 1:
            self.current_domain = self.domains[0]

        # make sure the utterance is lowercase if there is one; a missing utterance
        # becomes "" so the substring checks below cannot fail on None
        user_utterance = gen_user_utterance.strip().lower() if gen_user_utterance else ""

        # perform keyword matching to see if any domains are explicitly made active
        active_domains = [d for d in self.domains if d.get_keyword() in user_utterance]

        # Even if no domain has been specified, we should be able to exit
        if "bye" in user_utterance and not self.current_domain:
            return {"sys_utterance": "Thank you, goodbye."}

        # if there are active domains, use the first one
        if active_domains:
            self.current_domain = active_domains[0]
            out_key = f"user_utterance/{active_domains[0].get_domain_name()}"
            return {out_key: user_utterance}

        # if no domain is explicitly mentioned, assume the last one is still active
        if self.current_domain:
            out_key = f"user_utterance/{self.current_domain.get_domain_name()}"
            return {out_key: user_utterance}

        # Otherwise ask the user what domain they want
        return {"sys_utterance": self._domain_prompt()}

    def domains_to_str(self):
        """
            Method to create the greeting on the first turn, grammatically joins the names of possible domains into
            a string

            Returns:
                (str): String representing a list of all domain names the system can talk about;
                       empty if there are no domains
        """
        names = [d.get_display_name() for d in self.domains]
        if not names:
            return ""
        if len(names) <= 2:
            # one name is returned as is, two are joined by "and"
            return " and ".join(names)
        return ", ".join(names[:-1]) + f", and {names[-1]}"

`init(self, domains, greet_on_first_turn=False)` `special` ¶

Source code in adviser/services/domain_tracker/domain_tracker.py

def __init__(self, domains: List[Domain], greet_on_first_turn: bool = False):
    """
        Args:
            domains (List[Domain]): the domains the system can switch between
            greet_on_first_turn (bool): if True, the first call to select_domain of a
                                        dialog answers with a greeting instead of routing
    """
    Service.__init__(self, domain="")
    self.domains = domains
    self.current_domain = None
    self.greet_on_first_turn = greet_on_first_turn
    # select_domain increments self.turn; initialise it here so that it also works
    # when dialog_start has not been called yet
    self.turn = 0

`dialog_start(self)` ¶

Resets the domain tracker for the start of a new dialog

Source code in adviser/services/domain_tracker/domain_tracker.py

def dialog_start(self):
    """
        Resets the domain tracker for the start of a new dialog:
        the turn counter goes back to 0 and no domain is active.
    """
    self.turn = 0
    self.current_domain = None

`domains_to_str(self)` ¶

Method to create the greeting on the first turn, grammatically joins the names of possible domains into a string

Returns:

Type	Description
`(str)`	String representing a list of all domain names the system can talk about

Source code in adviser/services/domain_tracker/domain_tracker.py

def domains_to_str(self):
    """
        Method to create the greeting on the first turn, grammatically joins the names of possible domains into
        a string

        Returns:
            (str): String representing a list of all domain names the system can talk about;
                   empty if there are no domains
    """
    names = [d.get_display_name() for d in self.domains]
    if not names:
        # previously this case raised an IndexError
        return ""
    if len(names) <= 2:
        # one name is returned as is, two are joined by "and"
        return " and ".join(names)
    return ", ".join(names[:-1]) + f", and {names[-1]}"

`select_domain(self, *args, **kwargs)` ¶

Source code in adviser/services/domain_tracker/domain_tracker.py

def delegate(self, *args, **kwargs):
    """
    Call the wrapped function and publish the entries of its result dictionary.

    `func`, `pub_topics` and `_send_msg` are not defined in this block; they come from the
    enclosing scope (presumably the decorator that creates this wrapper - confirm there).

    Args:
        *args: positional arguments forwarded to `func`; `self` is dropped if it is among them
        **kwargs: keyword arguments forwarded to `func`

    Returns:
        The result of `func`. A non-empty result is re-keyed so that every key is cut at
        its first "/".
    """
    func_inst = getattr(self, func.__name__)

    callargs = list(args)
    if self in callargs:    # remove self when in *args, because already known to function
        callargs.remove(self)
    result = func(self, *callargs, **kwargs)
    if result:
        # fix! (user could have multiple "/" characters in topic - only use last one )
        # maps the part before the first "/" to the part between the first and second "/"
        domains = {res.split("/")[0]: res.split("/")[1] if "/" in res else "" for res in result}
        result = {key.split("/")[0]: result[key] for key in result}

    if func_inst not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[func_inst]
    domain = self._domain_name
    if socket and result:
        # publish messages
        for topic in pub_topics:
        # for topic in result: # NOTE publish any returned value in dict with it's key as topic
            if topic in result:
                # NOTE(review): `domain` is reassigned here and kept for the following
                # iterations, so a domain taken from one result key is reused for later
                # topics when self._domain_name is empty - confirm this is intended
                domain = domain if domain else domains[topic]
                topic_domain_str = f"{topic}/{domain}" if domain else topic
                # an entry in self._pub_topic_domains overrides the domain chosen above
                if topic in self._pub_topic_domains:
                    topic_domain_str = f"{topic}/{self._pub_topic_domains[topic]}" if self._pub_topic_domains[topic] else topic
                _send_msg(socket, topic_domain_str, result[topic])
                if self.debug_logger:
                    self.debug_logger.info(
                        f"- (DS): sent message from {func} to topic {topic_domain_str}:\n   {result[topic]}")
    return result

`emotion` `special` ¶

`EmotionRecognition` ¶

Emotion recognition module.

`EmotionRecognition (Service)` ¶

Emotion recognition module.

This module receives acoustic features, loads pretrained models and outputs predictions of emotional states. It can easily be extended/adapted to use different models and facial features in addition.

Source code in adviser/services/emotion/EmotionRecognition.py

class EmotionRecognition(Service):
    """Emotion recognition module.

    This module receives acoustic features, loads pretrained models and outputs
    predictions of emotional states. It can easily be extended/adapted to use
    different models and facial features in addition.
    """

    def __init__(self):
        """ Emotion recognition module.

        On initialization all necessary models are loaded: for each emotion
        representation ('category', 'arousal', 'valence') one pickled argument
        dictionary and one model state dict are read from the model directory.
        """
        Service.__init__(self)
        self.emotion_dir = os.path.dirname(os.path.abspath(__file__))
        self.model_path = os.path.abspath(
            os.path.join(
                self.emotion_dir, "..", "..", "resources", "models", "emotion"
            )
        )

        def load_args(emo_representation):
            # NOTE: unpickling can execute arbitrary code; these files must come
            # from a trusted source.
            args_file = os.path.join(
                self.model_path, f'{emo_representation}_args.pkl')
            # the context manager closes the file again (it was left open before)
            with open(args_file, 'rb') as handle:
                return pickle.load(handle)

        def load_model(emo_representation, arg_dict):
            ARGS = arg_dict['args']
            model = cnn(
                kernel_size=(ARGS.height, arg_dict['D_in']),
                D_out=arg_dict['D_out'],
                args=ARGS
            )
            model.load_state_dict(
                torch.load(
                    os.path.join(self.model_path,
                                 f'{emo_representation}_model_params.pt'),
                    map_location=torch.device('cpu')
                )
            )
            model.eval()
            return model

        self.emo_representations = ['category', 'arousal', 'valence']
        self.models = {}
        self.args = {}
        for emo_representation in self.emo_representations:
            self.args[emo_representation] = load_args(emo_representation)
            self.models[emo_representation] = load_model(
                emo_representation,
                self.args[emo_representation]
            )
        # class index -> label for each representation
        self.arousal_mapping = {0: 'low', 1: 'medium', 2: 'high'}
        self.valence_mapping = {0: 'negative', 1: 'neutral', 2: 'positive'}
        self.category_mapping = {
            0: EmotionType.Angry,
            1: EmotionType.Happy,
            2: EmotionType.Neutral,
            3: EmotionType.Sad
        }

    @PublishSubscribe(sub_topics=["fbank"], pub_topics=["emotion"])
    def predict_from_audio(self, fbank):
        """Emotion prediction from acoustic features.

        Args:
            fbank (torch.Tensor): feature array, shape (sequence, num_mel_bins)

        Returns:
            dict: nested dictionary containing all results, main key: 'emotion'
        """

        def normalize_and_pad_features(features: torch.Tensor, seq_len, mean: torch.Tensor, std: torch.Tensor):
            # normalize
            features = (features - mean) / std
            # cut to seq_len rows, or pad with zero rows if there are fewer
            missing = max(seq_len - features.size(0), 0)
            padding = features.new_zeros(missing, features.size(1))
            # concatenate zeros in time dimension
            return torch.cat([features[:seq_len], padding], dim=0)

        predictions = {}
        for emo_representation in self.emo_representations:
            seq_len = self.args[emo_representation]['args'].seq_length
            mean = self.args[emo_representation]['norm_mean']
            std = self.args[emo_representation]['norm_std']
            # feature normalization and padding has to be done for each
            # emotion representation individually because the means and
            # standard (deviations) (and sequence length) can be different
            features = normalize_and_pad_features(fbank, seq_len, torch.from_numpy(mean), torch.from_numpy(std))
            predictions[emo_representation] = softmax(
                self.models[emo_representation](features.unsqueeze(1)), dim=1
            ).detach().numpy()

        arousal_level = self.arousal_mapping[np.argmax(predictions['arousal'])]
        valence_level = self.valence_mapping[np.argmax(predictions['valence'])]
        category_label = self.category_mapping[np.argmax(predictions['category'])]

        # NOTE: the key 'cateogry_probabilities' is misspelled, but it is part of the
        # published message and therefore kept unchanged.
        return {'emotion': {'arousal': arousal_level,
                            'valence': valence_level,
                            'category': category_label,
                            'cateogry_probabilities':
                                np.around(predictions['category'], 2).reshape(-1)}}

`init(self)` `special` ¶

Emotion recognition module.

On initialization all necessary models are loaded.

Source code in adviser/services/emotion/EmotionRecognition.py

def __init__(self):
    """ Emotion recognition module.

    On initialization all necessary models are loaded.

    For each of the emotion representations 'category', 'arousal' and 'valence'
    a pickled argument dictionary (``<name>_args.pkl``) and the model parameters
    (``<name>_model_params.pt``) are read from ``resources/models/emotion``,
    resolved relative to the location of this file. The models are loaded onto
    the CPU and switched to evaluation mode.
    """
    Service.__init__(self)
    self.emotion_dir = os.path.dirname(os.path.abspath(__file__))
    self.model_path = os.path.abspath(
        os.path.join(
            self.emotion_dir, "..", "..", "resources", "models", "emotion"
        )
    )

    def load_args(emo_representation):
        """Return the unpickled argument dictionary of one emotion representation."""
        args_file = os.path.join(
            self.model_path, f'{emo_representation}_args.pkl'
        )
        # NOTE: unpickling executes arbitrary code - only trusted model files
        # must ever be placed in the model directory.
        # The context manager makes sure the file handle is closed again.
        with open(args_file, 'rb') as args_handle:
            return pickle.load(args_handle)

    def load_model(emo_representation, arg_dict):
        """Build the CNN for one emotion representation and load its trained parameters."""
        ARGS = arg_dict['args']
        model = cnn(
            kernel_size=(ARGS.height, arg_dict['D_in']),
            D_out=arg_dict['D_out'],
            args=ARGS
        )
        model.load_state_dict(
            torch.load(
                os.path.join(self.model_path,
                             f'{emo_representation}_model_params.pt'),
                map_location=torch.device('cpu')
            )
        )
        # inference only: put the model into evaluation mode
        model.eval()
        return model

    self.emo_representations = ['category', 'arousal', 'valence']
    self.models = {}
    self.args = {}
    for emo_representation in self.emo_representations:
        self.args[emo_representation] = load_args(emo_representation)
        self.models[emo_representation] = load_model(
            emo_representation,
            self.args[emo_representation]
        )
    # mappings from the index of the highest scoring output to its label
    self.arousal_mapping = {0: 'low', 1: 'medium', 2: 'high'}
    self.valence_mapping = {0: 'negative', 1: 'neutral', 2: 'positive'}
    self.category_mapping = {
        0: EmotionType.Angry,
        1: EmotionType.Happy,
        2: EmotionType.Neutral,
        3: EmotionType.Sad
    }

`predict_from_audio(self, *args, **kwargs)` ¶

Source code in adviser/services/emotion/EmotionRecognition.py

def delegate(self, *args, **kwargs):
    """
    Call the wrapped function and publish the values it returns.

    `func`, `pub_topics` and `_send_msg` are free names that are resolved
    outside of this function.

    A truthy result is treated as a mapping whose keys are either `topic` or
    `topic/domain` strings; the keys are reduced to the bare topic name.
    If the bound method is registered in `self._publish_sockets`, every topic
    listed in `pub_topics` that occurs in the result is sent over that socket.

    Returns:
        the result of the wrapped function (with normalized keys if it was truthy)
    """
    bound_method = getattr(self, func.__name__)

    # remove self when in *args, because already known to function
    positional = list(args)
    if self in positional:
        positional.remove(self)
    result = func(self, *positional, **kwargs)

    if result:
        # fix! (user could have multiple "/" characters in topic - only use last one )
        domains = {}
        by_topic = {}
        for key in result:
            parts = key.split("/")
            domains[parts[0]] = parts[1] if "/" in key else ""
            by_topic[parts[0]] = result[key]
        result = by_topic

    if bound_method not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[bound_method]
    domain = self._domain_name
    if not (socket and result):
        return result

    # publish messages
    # (alternative: iterate over result to publish any returned value with its key as topic)
    for topic in pub_topics:
        if topic not in result:
            continue
        # NOTE: once a domain was found it is kept for all following topics of this call
        if not domain:
            domain = domains[topic]
        target = f"{topic}/{domain}" if domain else topic
        if topic in self._pub_topic_domains:
            # a domain registered for this topic on the service takes precedence
            override = self._pub_topic_domains[topic]
            target = f"{topic}/{override}" if override else topic
        _send_msg(socket, target, result[topic])
        if self.debug_logger:
            self.debug_logger.info(
                f"- (DS): sent message from {func} to topic {target}:\n   {result[topic]}")
    return result

`engagement` `special` ¶

`engagement_tracker` ¶

`EngagementTracker (Service)` ¶

Start feature extraction with OpenFace. Requires OpenFace to be installed - instructions can be found in tool/openface.txt

Source code in adviser/services/engagement/engagement_tracker.py

class EngagementTracker(Service):
    """
    Start feature extraction with OpenFace.
    Requires OpenFace to be installed - instructions can be found in tool/openface.txt

    The service starts the OpenFace `FaceLandmarkVidZMQ` binary as a subprocess,
    communicates with it over a ZMQ PAIR socket and publishes `engagement` and
    `gaze_direction` messages whenever the estimated engagement level changes.
    """
    def __init__(self, domain="", camera_id: int = 0, openface_port: int = 6004, delay: int = 2, identifier=None):
        """
        Args:
            domain: accepted for interface compatibility.
                    NOTE(review): an empty domain is always forwarded to `Service.__init__` - confirm this is intended
            camera_id: index of the camera you want to use (if you only have one camera: 0)
            openface_port: local TCP port of the ZMQ connection to the OpenFace process
            delay: stored as `self.threshold` and used as a number of frames when averaging gaze angles
            identifier: forwarded to `Service.__init__`
        """
        Service.__init__(self, domain="", identifier=identifier)
        self.camera_id = camera_id
        self.openface_port = openface_port
        self.openface_running = False
        # NOTE(review): the original comment describes this as seconds (one second = 15 frames),
        # but the value is used directly as a frame count in `publish_gaze_directions`
        self.threshold = delay

        ctx = Context.instance()
        self.openface_endpoint = ctx.socket(zmq.PAIR)
        self.openface_endpoint.bind(f"tcp://127.0.0.1:{self.openface_port}")

        # Build the command as an argument list (safe for paths containing spaces) and
        # tell OpenFace to use the same port the socket above is bound to.
        openface_binary = os.path.join(get_root_dir(), 'tools/OpenFace/build/bin/FaceLandmarkVidZMQ')
        command = [openface_binary, "-device", str(self.camera_id), "-port", str(self.openface_port)]
        self.p_openface = subprocess.Popen(command, stdout=subprocess.PIPE)    # start OpenFace
        self.extracting = False
        self.extractor_thread = None


    def dialog_start(self):
        """
        Set OpenFace to publishing mode and block until it confirms.

        Once the "OPENFACE_STARTED" message was received, a thread running
        `publish_gaze_directions` is started.
        """
        self.openface_endpoint.send(b"OPENFACE_START")
        self.extracting = False
        while not self.extracting:
            msg = self.openface_endpoint.recv()    # receive started signal
            msg = msg.decode("utf-8")
            if msg == "OPENFACE_STARTED":
                print("START EXTRACTION")
                self.extracting = True
                self.extractor_thread = Thread(target=self.publish_gaze_directions)
                self.extractor_thread.start()


    @PublishSubscribe(pub_topics=["engagement", "gaze_direction"])
    def yield_gaze_direction(self, engagement: EngagementType, gaze_direction: Tuple[float, float]):
        """
        This is a helper function for the continuous publishing of engagement features.
        Call this function from a continuously running loop.

        Returns:
            engagement (EngagementType): high / low
            gaze_direction (float, float): tuple of gaze-x-angle and gaze-y-angle
        """
        return {"engagement": engagement, "gaze_direction": gaze_direction}


    def publish_gaze_directions(self):
        """
        Meant to be used in a thread.
        Runs a loop polling features from the OpenFace library until `self.extracting` is
        cleared or OpenFace reports "OPENFACE_ENDED", parsing them and extracting engagement features.
        Calls `yield_gaze_direction` to publish the engagement features whenever the
        engagement level changes.
        """

        x_coordinates = []
        y_coordinates = []

        norm = 0.0            # center point of screen; should be close(r) to 0
        looking = True

        while self.extracting:
            self.openface_endpoint.send(b"OPENFACE_PULL")
            msg = self.openface_endpoint.recv()
            try:
                msg = msg.decode("utf-8")
                if msg == "OPENFACE_ENDED":
                    # OpenFace stopped publishing: leave the loop explicitly instead of
                    # relying on a parse error of the non-JSON message
                    self.extracting = False
                    break
                msg_data = json.loads(msg)

                # only the magnitude of the angles is of interest
                gaze_x = abs(float(msg_data["gaze"]["angle"]["x"]))    # gaze_angle_x (left-right movement)
                gaze_y = abs(float(msg_data["gaze"]["angle"]["y"]))    # gaze_angle_y (up-down movement)
                x_coordinates.append(gaze_x)
                y_coordinates.append(gaze_y)
                current = len(x_coordinates) - 1
                if current > self.threshold:
                    # average over the `threshold + 1` frames preceding the current one
                    window = slice(current - (self.threshold + 1), current)
                    previous_x = mean(x_coordinates[window])
                    previous_y = mean(y_coordinates[window])
                    # distance of the averaged gaze angles from the screen center
                    difference_x = abs(norm - previous_x)
                    difference_y = abs(norm - previous_y)
                    # both distances have to stay below the tolerance to count as engaged
                    # (the constant regulates tolerance/strictness)
                    engaged = difference_x < 0.15 and difference_y < 0.15
                    if engaged != looking:
                        # publish only when the engagement level changes
                        looking = engaged
                        level = EngagementType.High if engaged else EngagementType.Low
                        self.yield_gaze_direction(engagement=level, gaze_direction=(gaze_x, gaze_y))
            except Exception:
                # best effort: skip frames that cannot be decoded, parsed or published
                # (SystemExit / KeyboardInterrupt are no longer swallowed)
                continue

    def dialog_end(self):
        """Set OpenFace to non-publishing mode and wait for the extractor thread (if any) to finish."""
        self.openface_endpoint.send(b"OPENFACE_END")
        if self.extractor_thread:
            self.extractor_thread.join()

    def dialog_exit(self):
        """Close the OpenFace process."""
        self.p_openface.kill()

`__init__(self, domain='', camera_id=0, openface_port=6004, delay=2, identifier=None)` `special` ¶

Parameters:

Name	Type	Description	Default
`camera_id`	`int`	index of the camera you want to use (if you only have one camera: 0)	`0`

Source code in adviser/services/engagement/engagement_tracker.py

def __init__(self, domain="", camera_id: int = 0, openface_port: int = 6004, delay: int = 2, identifier=None):
    """
    Args:
        domain: accepted for interface compatibility.
                NOTE(review): an empty domain is always forwarded to `Service.__init__` - confirm this is intended
        camera_id: index of the camera you want to use (if you only have one camera: 0)
        openface_port: local TCP port of the ZMQ connection to the OpenFace process
        delay: stored as `self.threshold`
        identifier: forwarded to `Service.__init__`
    """
    Service.__init__(self, domain="", identifier=identifier)
    self.camera_id = camera_id
    self.openface_port = openface_port
    self.openface_running = False
    self.threshold = delay   # original note: provide number of seconds as parameter, one second = 15 frames

    ctx = Context.instance()
    self.openface_endpoint = ctx.socket(zmq.PAIR)
    self.openface_endpoint.bind(f"tcp://127.0.0.1:{self.openface_port}")

    # Build the command as an argument list (safe for paths containing spaces) and
    # tell OpenFace to use the same port the socket above is bound to.
    openface_binary = os.path.join(get_root_dir(), 'tools/OpenFace/build/bin/FaceLandmarkVidZMQ')
    command = [openface_binary, "-device", str(self.camera_id), "-port", str(self.openface_port)]
    self.p_openface = subprocess.Popen(command, stdout=subprocess.PIPE)    # start OpenFace
    self.extracting = False
    self.extractor_thread = None

`dialog_end(self)` ¶

This function is called after a dialog ended (Topics.DIALOG_END message was received). You should overwrite this function to record dialog-level information.

Source code in adviser/services/engagement/engagement_tracker.py

def dialog_end(self):
    """Send the stop signal to OpenFace and wait for the extractor thread (if any) to finish."""
    # Set openface to non-publishing mode and wait until it is ready
    stop_signal = bytes("OPENFACE_END", encoding="ascii")
    self.openface_endpoint.send(stop_signal)
    worker = self.extractor_thread
    if worker:
        worker.join()

`dialog_exit(self)` ¶

This function is called when the dialog system is shutting down. You should overwrite this function to stop your threads and cleanup any open resources.

Source code in adviser/services/engagement/engagement_tracker.py

def dialog_exit(self):
    """Kill the OpenFace subprocess held in `self.p_openface`."""
    # close openface process
    openface_process = self.p_openface
    openface_process.kill()

`dialog_start(self)` ¶

This function is called before the first message to a new dialog is published. You should overwrite this function to set/reset dialog-level variables.

Source code in adviser/services/engagement/engagement_tracker.py

def dialog_start(self):
    """
    Switch OpenFace to publishing mode and block until it confirms.

    After the "OPENFACE_STARTED" message was received, a thread running
    `publish_gaze_directions` is created and started.
    """
    start_signal = bytes("OPENFACE_START", encoding="ascii")
    self.openface_endpoint.send(start_signal)
    self.extracting = False
    while not self.extracting:
        # receive started signal; any other message is ignored
        reply = self.openface_endpoint.recv().decode("utf-8")
        if reply != "OPENFACE_STARTED":
            continue
        print("START EXTRACTION")
        self.extracting = True
        self.extractor_thread = Thread(target=self.publish_gaze_directions)
        self.extractor_thread.start()

`publish_gaze_directions(self)` ¶

Meant to be used in a thread. Runs an infinite loop polling features from the OpenFace library, parsing them and extracting engagement features. Calls `yield_gaze_direction` to publish the polled and processed engagement features.

Source code in adviser/services/engagement/engagement_tracker.py

def publish_gaze_directions(self):
    """
    Meant to be used in a thread.
    Runs a loop polling features from the OpenFace library until `self.extracting` is
    cleared or OpenFace reports "OPENFACE_ENDED", parsing them and extracting engagement features.
    Calls `yield_gaze_direction` to publish the engagement features whenever the
    engagement level changes.
    """

    x_coordinates = []
    y_coordinates = []

    norm = 0.0            # center point of screen; should be close(r) to 0
    looking = True

    while self.extracting:
        self.openface_endpoint.send(b"OPENFACE_PULL")
        msg = self.openface_endpoint.recv()
        try:
            msg = msg.decode("utf-8")
            if msg == "OPENFACE_ENDED":
                # OpenFace stopped publishing: leave the loop explicitly instead of
                # relying on a parse error of the non-JSON message
                self.extracting = False
                break
            msg_data = json.loads(msg)

            # only the magnitude of the angles is of interest
            gaze_x = abs(float(msg_data["gaze"]["angle"]["x"]))    # gaze_angle_x (left-right movement)
            gaze_y = abs(float(msg_data["gaze"]["angle"]["y"]))    # gaze_angle_y (up-down movement)
            x_coordinates.append(gaze_x)
            y_coordinates.append(gaze_y)
            current = len(x_coordinates) - 1
            if current > self.threshold:
                # average over the `threshold + 1` frames preceding the current one
                window = slice(current - (self.threshold + 1), current)
                previous_x = mean(x_coordinates[window])
                previous_y = mean(y_coordinates[window])
                # distance of the averaged gaze angles from the screen center
                difference_x = abs(norm - previous_x)
                difference_y = abs(norm - previous_y)
                # both distances have to stay below the tolerance to count as engaged
                # (the constant regulates tolerance/strictness)
                engaged = difference_x < 0.15 and difference_y < 0.15
                if engaged != looking:
                    # publish only when the engagement level changes
                    looking = engaged
                    level = EngagementType.High if engaged else EngagementType.Low
                    self.yield_gaze_direction(engagement=level, gaze_direction=(gaze_x, gaze_y))
        except Exception:
            # best effort: skip frames that cannot be decoded, parsed or published
            # (SystemExit / KeyboardInterrupt are no longer swallowed)
            continue

`yield_gaze_direction(self, *args, **kwargs)` ¶

Source code in adviser/services/engagement/engagement_tracker.py

def delegate(self, *args, **kwargs):
    """
    Call the wrapped function and publish the values it returns.

    `func`, `pub_topics` and `_send_msg` are free names that are resolved
    outside of this function.

    A truthy result is treated as a mapping whose keys are either `topic` or
    `topic/domain` strings; the keys are reduced to the bare topic name.
    If the bound method is registered in `self._publish_sockets`, every topic
    listed in `pub_topics` that occurs in the result is sent over that socket.

    Returns:
        the result of the wrapped function (with normalized keys if it was truthy)
    """
    bound_method = getattr(self, func.__name__)

    # remove self when in *args, because already known to function
    positional = list(args)
    if self in positional:
        positional.remove(self)
    result = func(self, *positional, **kwargs)

    if result:
        # fix! (user could have multiple "/" characters in topic - only use last one )
        domains = {}
        by_topic = {}
        for key in result:
            parts = key.split("/")
            domains[parts[0]] = parts[1] if "/" in key else ""
            by_topic[parts[0]] = result[key]
        result = by_topic

    if bound_method not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[bound_method]
    domain = self._domain_name
    if not (socket and result):
        return result

    # publish messages
    # (alternative: iterate over result to publish any returned value with its key as topic)
    for topic in pub_topics:
        if topic not in result:
            continue
        # NOTE: once a domain was found it is kept for all following topics of this call
        if not domain:
            domain = domains[topic]
        target = f"{topic}/{domain}" if domain else topic
        if topic in self._pub_topic_domains:
            # a domain registered for this topic on the service takes precedence
            override = self._pub_topic_domains[topic]
            target = f"{topic}/{override}" if override else topic
        _send_msg(socket, target, result[topic])
        if self.debug_logger:
            self.debug_logger.info(
                f"- (DS): sent message from {func} to topic {target}:\n   {result[topic]}")
    return result

`get_root_dir()` ¶

Source code in adviser/services/engagement/engagement_tracker.py

def get_root_dir():
    """Return the absolute path of the directory three levels above this file."""
    path = os.path.abspath(__file__)
    # strip the file name and two further directory levels
    for _ in range(3):
        path = os.path.dirname(path)
    return path

`hci` `special` ¶

`all` `special` ¶

`console` ¶

The console module provides ADVISER modules that access the console for input and output.

`ConsoleInput (Service)` ¶

Gets the user utterance from the console.

Waits for the built-in input function to return a non-empty text.

Source code in adviser/services/hci/console.py

class ConsoleInput(Service):
    """
    Gets the user utterance from the console.

    Reads lines from standard input until a non-empty line was entered.
    """

    def __init__(self, domain: Domain = None, conversation_log_dir: str = None, language: Language = None):
        """
        Args:
            domain: forwarded to `Service.__init__`
            conversation_log_dir: if given, every user utterance is additionally written to a file in this directory
            language: currently not used - the language is always set to English
        """
        Service.__init__(self, domain=domain)
        # the `language` argument is ignored for now; interactive selection via
        # `_set_language` is disabled
        self.language = Language.ENGLISH
        self.conversation_log_dir = conversation_log_dir
        self.interaction_count = 0

    def dialog_start(self):
        """Reset the interaction counter at the beginning of a dialog."""
        self.interaction_count = 0

    @PublishSubscribe(sub_topics=[Topic.DIALOG_END], pub_topics=["gen_user_utterance"])
    def get_user_input(self, dialog_end: bool = True) -> dict(user_utterance=str):
        """
        Read the next user utterance from the console.

        If `dialog_end` is true, nothing is read and no message is passed.
        Otherwise, it blocks the application until the user has entered a
        valid (i.e. non-empty) message in the console.

        Args:
            dialog_end (bool): whether the dialog has ended

        Returns:
            dict: a dict containing the user utterance under the key
                  `gen_user_utterance` (the line as read, without further
                  stripping), or None if `dialog_end` is true
        """
        if dialog_end:
            return

        utterance = self._input()
        # write into logging directory; the file name is the current unix timestamp in seconds
        if self.conversation_log_dir is not None:
            with open(os.path.join(self.conversation_log_dir, (str(math.floor(time.time())) + "_user.txt")),
                      "w") as convo_log:
                convo_log.write(utterance)
        return {'gen_user_utterance': utterance}

    def _input(self):
        """
        Helper function for reading text input from the console

        Prompts with '>>> ' and reads lines until a non-blank line arrives or the
        parent dialog system reports that it is terminating (in which case stdin
        is closed). On any error the text read so far is returned (possibly empty).
        """
        utterance = ''
        try:
            sys.stdout.write('>>> ')
            sys.stdout.flush()
            line = sys.stdin.readline()
            while line.strip() == '' and not getattr(self, '_dialog_system_parent').terminating():
                line = sys.stdin.readline()
            utterance = line
            if getattr(self, '_dialog_system_parent').terminating():
                sys.stdin.close()
            return utterance
        except Exception:
            # best effort (e.g. stdin already closed or no parent dialog system attached);
            # SystemExit / KeyboardInterrupt are deliberately not swallowed
            return utterance

    def _set_language(self) -> Language:
        """
            asks the user to select the language of the system, returning the enum
            representing their preference, or None if they don't give a recognized
            input
        """
        utterance = ""
        print("Please select your language: English or German")
        while utterance.strip() == "":
            utterance = input(">>> ")
        utterance = utterance.lower()
        if utterance in ('e', 'english'):
            return Language.ENGLISH
        if utterance in ('g', 'german', 'deutsch', 'd'):
            return Language.GERMAN
        return None

`__init__(self, domain=None, conversation_log_dir=None, language=None)` `special` ¶

Source code in adviser/services/hci/console.py

def __init__(self, domain: Domain = None, conversation_log_dir: str = None, language: Language = None):
    """
    Args:
        domain: forwarded to `Service.__init__`
        conversation_log_dir: stored for later use as logging directory
        language: currently not used - the language is always set to English
    """
    Service.__init__(self, domain=domain)
    self.interaction_count = 0
    self.conversation_log_dir = conversation_log_dir
    # the `language` argument is ignored for now and interactive selection via
    # `_set_language()` is disabled: English is always used
    self.language = Language.ENGLISH

`dialog_start(self)` ¶

This function is called before the first message to a new dialog is published. You should overwrite this function to set/reset dialog-level variables.

Source code in adviser/services/hci/console.py

def dialog_start(self):
    """Reset the interaction counter to zero."""
    self.interaction_count = 0

`get_user_input(self, *args, **kwargs)` ¶

Source code in adviser/services/hci/console.py

def delegate(self, *args, **kwargs):
    """
    Call the wrapped function and publish the values it returns.

    `func`, `pub_topics` and `_send_msg` are free names that are resolved
    outside of this function.

    A truthy result is treated as a mapping whose keys are either `topic` or
    `topic/domain` strings; the keys are reduced to the bare topic name.
    If the bound method is registered in `self._publish_sockets`, every topic
    listed in `pub_topics` that occurs in the result is sent over that socket.

    Returns:
        the result of the wrapped function (with normalized keys if it was truthy)
    """
    bound_method = getattr(self, func.__name__)

    # remove self when in *args, because already known to function
    positional = list(args)
    if self in positional:
        positional.remove(self)
    result = func(self, *positional, **kwargs)

    if result:
        # fix! (user could have multiple "/" characters in topic - only use last one )
        domains = {}
        by_topic = {}
        for key in result:
            parts = key.split("/")
            domains[parts[0]] = parts[1] if "/" in key else ""
            by_topic[parts[0]] = result[key]
        result = by_topic

    if bound_method not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[bound_method]
    domain = self._domain_name
    if not (socket and result):
        return result

    # publish messages
    # (alternative: iterate over result to publish any returned value with its key as topic)
    for topic in pub_topics:
        if topic not in result:
            continue
        # NOTE: once a domain was found it is kept for all following topics of this call
        if not domain:
            domain = domains[topic]
        target = f"{topic}/{domain}" if domain else topic
        if topic in self._pub_topic_domains:
            # a domain registered for this topic on the service takes precedence
            override = self._pub_topic_domains[topic]
            target = f"{topic}/{override}" if override else topic
        _send_msg(socket, target, result[topic])
        if self.debug_logger:
            self.debug_logger.info(
                f"- (DS): sent message from {func} to topic {target}:\n   {result[topic]}")
    return result

`ConsoleOutput (Service)` ¶

Writes the system utterance to the console.

Source code in adviser/services/hci/console.py

class ConsoleOutput(Service):
    """Service that prints the system utterance to the console."""

    def __init__(self, domain: Domain = None):
        """
        Args:
            domain: forwarded to `Service.__init__`
        """
        Service.__init__(self, domain=domain)

    @PublishSubscribe(sub_topics=["sys_utterance"], pub_topics=[Topic.DIALOG_END])
    def print_sys_utterance(self, sys_utterance: str = None) -> dict():
        """
        Print the given system utterance, prefixed with "System: ".

        Args:
            sys_utterance (str): The system utterance

        Returns:
            dict with entry dialog_end: True if the utterance contains 'bye', False otherwise

        Raises:
            ValueError: if there is no system utterance to print
        """
        # guard: refuse missing or empty utterances
        if sys_utterance is None or sys_utterance == "":
            raise ValueError("There is no system utterance. Did you forget to call an NLG module before?")

        print("System: {}".format(sys_utterance))

        dialog_finished = 'bye' in sys_utterance
        return {Topic.DIALOG_END: dialog_finished}

`__init__(self, domain=None)` `special` ¶

Source code in adviser/services/hci/console.py

def __init__(self, domain: Domain = None):
    """
    Args:
        domain: forwarded unchanged to `Service.__init__`
    """
    Service.__init__(self, domain=domain)

`print_sys_utterance(self, *args, **kwargs)` ¶

Source code in adviser/services/hci/console.py

def delegate(self, *args, **kwargs):
    """
    Call the wrapped function and publish the values it returns.

    `func`, `pub_topics` and `_send_msg` are free names that are resolved
    outside of this function.

    A truthy result is treated as a mapping whose keys are either `topic` or
    `topic/domain` strings; the keys are reduced to the bare topic name.
    If the bound method is registered in `self._publish_sockets`, every topic
    listed in `pub_topics` that occurs in the result is sent over that socket.

    Returns:
        the result of the wrapped function (with normalized keys if it was truthy)
    """
    bound_method = getattr(self, func.__name__)

    # remove self when in *args, because already known to function
    positional = list(args)
    if self in positional:
        positional.remove(self)
    result = func(self, *positional, **kwargs)

    if result:
        # fix! (user could have multiple "/" characters in topic - only use last one )
        domains = {}
        by_topic = {}
        for key in result:
            parts = key.split("/")
            domains[parts[0]] = parts[1] if "/" in key else ""
            by_topic[parts[0]] = result[key]
        result = by_topic

    if bound_method not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[bound_method]
    domain = self._domain_name
    if not (socket and result):
        return result

    # publish messages
    # (alternative: iterate over result to publish any returned value with its key as topic)
    for topic in pub_topics:
        if topic not in result:
            continue
        # NOTE: once a domain was found it is kept for all following topics of this call
        if not domain:
            domain = domains[topic]
        target = f"{topic}/{domain}" if domain else topic
        if topic in self._pub_topic_domains:
            # a domain registered for this topic on the service takes precedence
            override = self._pub_topic_domains[topic]
            target = f"{topic}/{override}" if override else topic
        _send_msg(socket, target, result[topic])
        if self.debug_logger:
            self.debug_logger.info(
                f"- (DS): sent message from {func} to topic {target}:\n   {result[topic]}")
    return result

`gui` ¶

`GUIServer (Service)` ¶

Source code in adviser/services/hci/gui.py

class GUIServer(Service):
    """Service connecting the dialog system with the web UI via a websocket."""

    def __init__(self, logger=None):
        """
        Create the event loop used for websocket writes and open the web UI in a browser.

        Args:
            logger: not used by this constructor
        """
        super().__init__(domain="", identifier="GUIServer")
        self.websocket = None
        self.loopy_loop = asyncio.new_event_loop()
        # open UI in webbrowser automatically
        chat_page = os.path.join(os.path.realpath(''), 'tools', 'webui', 'chat.html')
        webui_path = f"file:///{chat_page}"
        print("WEBUI accessible at", webui_path)
        webbrowser.open(webui_path)

    @PublishSubscribe(pub_topics=['gen_user_utterance'])
    def user_utterance(self, message = ""):
        """Publish the given message on the `gen_user_utterance` topic."""
        return {'gen_user_utterance': message}

    @PublishSubscribe(sub_topics=['sys_utterance'])
    def forward_sys_utterance(self, sys_utterance: str):
        """Pass a received system utterance on to the web UI."""
        self.forward_message_to_react(message=sys_utterance, topic="sys_utterance")

    def forward_message_to_react(self, message, topic: str):
        """
        Write a message to the websocket, if one is set.

        Args:
            message: payload, sent under the key "msg"
            topic (str): topic name, sent under the key "topic"
        """
        asyncio.set_event_loop(self.loopy_loop)
        if not self.websocket:
            # no websocket available: nothing to send
            return
        payload = {"topic": topic, "msg": message}
        self.websocket.write_message(payload)

`__init__(self, logger=None)` `special` ¶

Source code in adviser/services/hci/gui.py

def __init__(self, logger=None):
    """
    Create the event loop used for websocket writes and open the web UI in a browser.

    Args:
        logger: not used by this constructor
    """
    super().__init__(domain="", identifier="GUIServer")
    self.websocket = None
    self.loopy_loop = asyncio.new_event_loop()
    # open UI in webbrowser automatically
    chat_page = os.path.join(os.path.realpath(''), 'tools', 'webui', 'chat.html')
    webui_path = f"file:///{chat_page}"
    print("WEBUI accessible at", webui_path)
    webbrowser.open(webui_path)

`forward_message_to_react(self, message, topic)` ¶

Source code in adviser/services/hci/gui.py

def forward_message_to_react(self, message, topic: str):
    """
    Write a message to the websocket, if one is set.

    Args:
        message: payload, sent under the key "msg"
        topic (str): topic name, sent under the key "topic"
    """
    asyncio.set_event_loop(self.loopy_loop)
    if not self.websocket:
        # no websocket available: nothing to send
        return
    payload = {"topic": topic, "msg": message}
    self.websocket.write_message(payload)

`forward_sys_utterance(self, *args, **kwargs)` ¶

Source code in adviser/services/hci/gui.py

def delegate(self, *args, **kwargs):
    """
    Call the wrapped function and publish the values it returns.

    `func`, `pub_topics` and `_send_msg` are free names that are resolved
    outside of this function.

    A truthy result is treated as a mapping whose keys are either `topic` or
    `topic/domain` strings; the keys are reduced to the bare topic name.
    If the bound method is registered in `self._publish_sockets`, every topic
    listed in `pub_topics` that occurs in the result is sent over that socket.

    Returns:
        the result of the wrapped function (with normalized keys if it was truthy)
    """
    bound_method = getattr(self, func.__name__)

    # remove self when in *args, because already known to function
    positional = list(args)
    if self in positional:
        positional.remove(self)
    result = func(self, *positional, **kwargs)

    if result:
        # fix! (user could have multiple "/" characters in topic - only use last one )
        domains = {}
        by_topic = {}
        for key in result:
            parts = key.split("/")
            domains[parts[0]] = parts[1] if "/" in key else ""
            by_topic[parts[0]] = result[key]
        result = by_topic

    if bound_method not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[bound_method]
    domain = self._domain_name
    if not (socket and result):
        return result

    # publish messages
    # (alternative: iterate over result to publish any returned value with its key as topic)
    for topic in pub_topics:
        if topic not in result:
            continue
        # NOTE: once a domain was found it is kept for all following topics of this call
        if not domain:
            domain = domains[topic]
        target = f"{topic}/{domain}" if domain else topic
        if topic in self._pub_topic_domains:
            # a domain registered for this topic on the service takes precedence
            override = self._pub_topic_domains[topic]
            target = f"{topic}/{override}" if override else topic
        _send_msg(socket, target, result[topic])
        if self.debug_logger:
            self.debug_logger.info(
                f"- (DS): sent message from {func} to topic {target}:\n   {result[topic]}")
    return result

`user_utterance(self, *args, **kwargs)` ¶

Source code in adviser/services/hci/gui.py

def delegate(self, *args, **kwargs):
    """
    Call the wrapped function and publish the values it returns.

    `func`, `pub_topics` and `_send_msg` are free names that are resolved
    outside of this function.

    A truthy result is treated as a mapping whose keys are either `topic` or
    `topic/domain` strings; the keys are reduced to the bare topic name.
    If the bound method is registered in `self._publish_sockets`, every topic
    listed in `pub_topics` that occurs in the result is sent over that socket.

    Returns:
        the result of the wrapped function (with normalized keys if it was truthy)
    """
    bound_method = getattr(self, func.__name__)

    # remove self when in *args, because already known to function
    positional = list(args)
    if self in positional:
        positional.remove(self)
    result = func(self, *positional, **kwargs)

    if result:
        # fix! (user could have multiple "/" characters in topic - only use last one )
        domains = {}
        by_topic = {}
        for key in result:
            parts = key.split("/")
            domains[parts[0]] = parts[1] if "/" in key else ""
            by_topic[parts[0]] = result[key]
        result = by_topic

    if bound_method not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[bound_method]
    domain = self._domain_name
    if not (socket and result):
        return result

    # publish messages
    # (alternative: iterate over result to publish any returned value with its key as topic)
    for topic in pub_topics:
        if topic not in result:
            continue
        # NOTE: once a domain was found it is kept for all following topics of this call
        if not domain:
            domain = domains[topic]
        target = f"{topic}/{domain}" if domain else topic
        if topic in self._pub_topic_domains:
            # a domain registered for this topic on the service takes precedence
            override = self._pub_topic_domains[topic]
            target = f"{topic}/{override}" if override else topic
        _send_msg(socket, target, result[topic])
        if self.debug_logger:
            self.debug_logger.info(
                f"- (DS): sent message from {func} to topic {target}:\n   {result[topic]}")
    return result

`speech` `special` ¶

`SpeechInputDecoder` ¶

`SpeechInputDecoder (Service)` ¶

Source code in adviser/services/hci/speech/SpeechInputDecoder.py

class SpeechInputDecoder(Service):
    """
    Speech recognition service: turns the feature matrix published on `speech_features`
    into text and publishes it on `gen_user_utterance`.
    """

    def __init__(self, domain: Domain = "", identifier=None, conversation_log_dir: str = None, use_cuda=False):
        """
        Transforms spoken input from the user to text for further processing.

        Loads the trained model and its normalization statistics from
        `<root>/resources/models/speech/multi_en_20190916` and prepares a beam search over it.

        Args:
            domain (Domain): Needed for Service, but has no meaning here
            identifier (string): Needed for Service
            conversation_log_dir (string): If this is provided, logfiles will be placed by this Service into the specified directory.
            use_cuda (boolean): Whether or not to run the computations on a GPU
        """
        Service.__init__(self, domain=domain, identifier=identifier)
        self.conversation_log_dir = conversation_log_dir

        # load model
        model_dir = os.path.join(get_root_dir(), "resources", "models", "speech", "multi_en_20190916")
        self.model, conf = load_trained_model(os.path.join(model_dir, "model.bin"))
        self.vocab = conf.char_list

        # setup beam search; the CTC scorer is weighted 0.0, so only the decoder score counts
        self.bs = BeamSearch(scorers=self.model.scorers(),
                             weights={"decoder": 1.0, "ctc": 0.0},
                             sos=self.model.sos,
                             eos=self.model.eos,
                             beam_size=4,
                             vocab_size=len(self.vocab),
                             pre_beam_score_key="decoder")

        # swap the class of the already constructed object so the batched implementation is used
        self.bs.__class__ = BatchBeamSearch

        # choose hardware to run on
        self.device = "cuda" if use_cuda else "cpu"

        self.model.to(self.device)
        self.bs.to(self.device)

        # change from training mode to eval mode
        self.model.eval()
        self.bs.eval()

        # scale and offset for feature normalization
        # follows https://github.com/kaldi-asr/kaldi/blob/33255ed224500f55c8387f1e4fa40e08b73ff48a/src/transform/cmvn.cc#L92-L111
        # row 0 holds per-dimension sums with the count as last entry, row 1 is used for the
        # second moment (layout as in the Kaldi code referenced above)
        norm = torch.load(os.path.join(model_dir, "cmvn.bin"))
        count = norm[0][-1]
        mean = norm[0][:-1] / count
        var = (norm[1][:-1] / count) - mean * mean
        self.scale = 1.0 / torch.sqrt(var)
        self.offset = - (mean * self.scale)

    @PublishSubscribe(sub_topics=["speech_features"], pub_topics=["gen_user_utterance"])
    def features_to_text(self, speech_features):
        """
        Turns features of the utterance into a string and returns the user utterance in form of text

        The decoded text is also printed and, if `conversation_log_dir` was given, written to
        `<unix time in seconds>_user.txt` in that directory.

        Args:
            speech_features (np.array): The features that the speech feature extraction module produces

        Returns:
            dict(string, string): The user utterance as text
        """
        # normalization happens before the tensor is moved to the target device
        speech_in_features_normalized = torch.from_numpy(speech_features) * self.scale + self.offset
        with torch.no_grad():
            encoded = self.model.encode(speech_in_features_normalized.to(self.device))
            result = self.bs.forward(encoded)

        # We only consider the most probable hypothesis.
        # Language Model could improve this, right now we don't use one.
        # This might need some post-processing...
        user_utterance = "".join(self.vocab[y] for y in result[0].yseq) \
            .replace("▁", " ") \
            .replace("<space>", " ") \
            .replace("<eos>", "") \
            .strip()

        # write decoded text into logging directory
        if self.conversation_log_dir is not None:
            # int() equals floor() for the non-negative epoch time. The previous
            # `np.math.floor` relied on the `numpy.math` alias, which no longer exists
            # in NumPy 2.x and made logging crash there.
            log_name = str(int(time.time())) + "_user.txt"
            with open(os.path.join(self.conversation_log_dir, log_name), "w") as convo_log:
                convo_log.write(user_utterance)

        print("User: {}\n".format(user_utterance))

        return {'gen_user_utterance': user_utterance}

`__init__(self, domain='', identifier=None, conversation_log_dir=None, use_cuda=False)` `special` ¶

Transforms spoken input from the user to text for further processing.

Parameters:

Name	Type	Description	Default
`domain`	`Domain`	Needed for Service, but has no meaning here	`''`
`identifier`	`string`	Needed for Service	`None`
`conversation_log_dir`	`string`	If this is provided, logfiles will be placed by this Service into the specified directory.	`None`
`use_cuda`	`boolean`	Whether or not to run the computations on a GPU	`False`

Source code in adviser/services/hci/speech/SpeechInputDecoder.py

def __init__(self, domain: Domain = "", identifier=None, conversation_log_dir: str = None, use_cuda=False):
    """
    Set up the speech-to-text service: load the trained model, configure the beam search
    and precompute the feature normalization.

    Args:
        domain (Domain): Needed for Service, but has no meaning here
        identifier (string): Needed for Service
        conversation_log_dir (string): If given, this Service places its logfiles in that directory.
        use_cuda (boolean): Run the computations on a GPU instead of the CPU
    """
    Service.__init__(self, domain=domain, identifier=identifier)
    self.conversation_log_dir = conversation_log_dir

    # trained model and its configuration
    asr_dir = os.path.join(get_root_dir(), "resources", "models", "speech", "multi_en_20190916")
    self.model, train_conf = load_trained_model(os.path.join(asr_dir, "model.bin"))
    self.vocab = train_conf.char_list

    # beam search settings; the CTC scorer gets weight 0.0, so only the decoder score counts
    search_settings = dict(
        scorers=self.model.scorers(),
        weights={"decoder": 1.0, "ctc": 0.0},
        sos=self.model.sos,
        eos=self.model.eos,
        beam_size=4,
        vocab_size=len(self.vocab),
        pre_beam_score_key="decoder",
    )
    self.bs = BeamSearch(**search_settings)
    # re-class the constructed object so that the batched implementation is used
    self.bs.__class__ = BatchBeamSearch

    # move both modules to the chosen hardware, then switch them from training to eval mode
    self.device = "cuda" if use_cuda else "cpu"
    for module in (self.model, self.bs):
        module.to(self.device)
    for module in (self.model, self.bs):
        module.eval()

    # scale and offset for feature normalization
    # follows https://github.com/kaldi-asr/kaldi/blob/33255ed224500f55c8387f1e4fa40e08b73ff48a/src/transform/cmvn.cc#L92-L111
    stats = torch.load(os.path.join(asr_dir, "cmvn.bin"))
    first_row, second_row = stats[0], stats[1]
    count = first_row[-1]  # last entry of the first row is the count
    mean = first_row[:-1] / count
    variance = second_row[:-1] / count - mean * mean
    self.scale = 1.0 / torch.sqrt(variance)
    self.offset = -(mean * self.scale)

`features_to_text(self, *args, **kwargs)` ¶

Source code in adviser/services/hci/speech/SpeechInputDecoder.py

def delegate(self, *args, **kwargs):
    # Wrapper around `func` (a name from the enclosing scope, not shown here): calls it and,
    # when the bound method has a publish socket, sends the returned values out topic by topic.
    # Returns the result dict with any "/domain" suffix removed from its keys.
    func_inst = getattr(self, func.__name__)

    # `self` is passed explicitly below, so drop it if it also arrived through *args
    callargs = list(args)
    if self in callargs:
        callargs.remove(self)
    result = func(self, *callargs, **kwargs)

    if result:
        # Keys are "topic" or "topic/domain". Only the first two "/"-separated parts are
        # used, so anything after a second "/" is ignored (known limitation, marked "fix!"
        # in the original code).
        domains = {}
        bare_result = {}
        for key in result:
            parts = key.split("/")
            domains[parts[0]] = parts[1] if "/" in key else ""
            bare_result[parts[0]] = result[key]
        result = bare_result

    if func_inst not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[func_inst]
    domain = self._domain_name
    if not (socket and result):
        # nothing to publish with, or nothing to publish
        return result

    # Only the declared pub_topics are published; other keys in the result are not sent.
    for topic in pub_topics:
        if topic not in result:
            continue
        # the service domain wins; otherwise the first domain found in a result key is kept
        # for every following topic of this call
        domain = domain or domains[topic]
        if topic in self._pub_topic_domains:
            # an explicit per-topic setting overrides both of the above
            override = self._pub_topic_domains[topic]
            topic_domain_str = f"{topic}/{override}" if override else topic
        else:
            topic_domain_str = f"{topic}/{domain}" if domain else topic
        _send_msg(socket, topic_domain_str, result[topic])
        if self.debug_logger:
            self.debug_logger.info(
                f"- (DS): sent message from {func} to topic {topic_domain_str}:\n   {result[topic]}")
    return result

`get_root_dir()` ¶

Source code in adviser/services/hci/speech/SpeechInputDecoder.py

def get_root_dir():
    """Return the directory four levels above this file's directory entry (absolute path)."""
    path = os.path.abspath(__file__)
    # strip the file name and then three parent directories
    for _ in range(4):
        path = os.path.dirname(path)
    return path

`SpeechInputFeatureExtractor` ¶

`SpeechInputFeatureExtractor (Service)` ¶

Source code in adviser/services/hci/speech/SpeechInputFeatureExtractor.py

class SpeechInputFeatureExtractor(Service):
    """
    Service that converts recorded audio (topic `speech_in`) into acoustic features.

    Three representations are published: `speech_features` (input for the ASR decoder),
    `mfcc` and `fbank`.
    """

    def __init__(self, domain: Domain = ""):
        """
        Given a sound, this service extracts features and passes them on to the decoder for ASR

        Args:
            domain (Domain): Needed for Service, no meaning here
        """
        Service.__init__(self, domain=domain)

    @PublishSubscribe(sub_topics=["speech_in"], pub_topics=["speech_features"])
    def speech_to_features(self, speech_in: Tuple[numpy.array, int]):
        """
        Computes 80 filterbank features per frame and appends three zero-valued pitch columns.

        Args:
            speech_in (tuple(np.array, int)): The utterance as array, and its sampling rate

        Returns:
            dict(string, np.array): The feature matrix under the key 'speech_features'
        """
        samples, sampling_rate = speech_in[0], speech_in[1]
        waveform = torch.from_numpy(samples).unsqueeze(0)

        # Default ASR model uses 16kHz, but different models are possible; then the sampling
        # rate only needs to be changed in the recorder
        filter_bank = torchaudio.compliance.kaldi.fbank(waveform, num_mel_bins=80, sample_frequency=sampling_rate)
        # placeholder for the pitch features: one row per frame, all zeros
        # TODO: check if torchaudio pitch function is better
        pitch_placeholder = torch.zeros(filter_bank.shape[0], 3)
        features = torch.cat([filter_bank, pitch_placeholder], 1)

        return {'speech_features': features.numpy()}

    @PublishSubscribe(sub_topics=["speech_in"], pub_topics=["mfcc"])
    def speech_to_mfcc(self, speech_in):
        """
        Extracts Mel Frequency Cepstral Coefficients (MFCC) from the input utterance using
        torchaudio's default settings (13 coefficients according to the original documentation).

        Args:
            speech_in (tuple(np.array, int)): The utterance as array, and its sampling rate

        Returns:
            dict: The result of the torchaudio call under the key 'mfcc' (not converted to numpy)
        """
        waveform = torch.from_numpy(speech_in[0]).unsqueeze(0)
        coefficients = torchaudio.compliance.kaldi.mfcc(waveform, sample_frequency=speech_in[1])
        return {'mfcc': coefficients}

    @PublishSubscribe(sub_topics=["speech_in"], pub_topics=["fbank"])
    def speech_to_fbank(self, speech_in):
        """
        Extracts filterbank features from the input utterance using torchaudio's default
        settings (23 filterbanks according to the original documentation).

        Args:
            speech_in (tuple(np.array, int)): The utterance as array, and its sampling rate

        Returns:
            dict: The result of the torchaudio call under the key 'fbank' (not converted to numpy)
        """
        waveform = torch.from_numpy(speech_in[0]).unsqueeze(0)
        banks = torchaudio.compliance.kaldi.fbank(waveform, sample_frequency=speech_in[1])
        return {'fbank': banks}

`__init__(self, domain='')` `special` ¶

Given a sound, this service extracts features and passes them on to the decoder for ASR

Parameters:

Name	Type	Description	Default
`domain`	`Domain`	Needed for Service, no meaning here	`''`

Source code in adviser/services/hci/speech/SpeechInputFeatureExtractor.py

def __init__(self, domain: Domain = ""):
    """
    Initialise the service that extracts features from a sound and passes them on to the
    decoder for ASR.

    Args:
        domain (Domain): Needed for Service, no meaning here; forwarded unchanged to the base class
    """
    # no state of its own is set here; all setup is delegated to the Service base class
    Service.__init__(self, domain=domain)

`speech_to_fbank(self, *args, **kwargs)` ¶

Source code in adviser/services/hci/speech/SpeechInputFeatureExtractor.py

def delegate(self, *args, **kwargs):
    # Wrapper around `func` (a name from the enclosing scope, not shown here): calls it and,
    # when the bound method has a publish socket, sends the returned values out topic by topic.
    # Returns the result dict with any "/domain" suffix removed from its keys.
    func_inst = getattr(self, func.__name__)

    # `self` is passed explicitly below, so drop it if it also arrived through *args
    callargs = list(args)
    if self in callargs:
        callargs.remove(self)
    result = func(self, *callargs, **kwargs)

    if result:
        # Keys are "topic" or "topic/domain". Only the first two "/"-separated parts are
        # used, so anything after a second "/" is ignored (known limitation, marked "fix!"
        # in the original code).
        domains = {}
        bare_result = {}
        for key in result:
            parts = key.split("/")
            domains[parts[0]] = parts[1] if "/" in key else ""
            bare_result[parts[0]] = result[key]
        result = bare_result

    if func_inst not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[func_inst]
    domain = self._domain_name
    if not (socket and result):
        # nothing to publish with, or nothing to publish
        return result

    # Only the declared pub_topics are published; other keys in the result are not sent.
    for topic in pub_topics:
        if topic not in result:
            continue
        # the service domain wins; otherwise the first domain found in a result key is kept
        # for every following topic of this call
        domain = domain or domains[topic]
        if topic in self._pub_topic_domains:
            # an explicit per-topic setting overrides both of the above
            override = self._pub_topic_domains[topic]
            topic_domain_str = f"{topic}/{override}" if override else topic
        else:
            topic_domain_str = f"{topic}/{domain}" if domain else topic
        _send_msg(socket, topic_domain_str, result[topic])
        if self.debug_logger:
            self.debug_logger.info(
                f"- (DS): sent message from {func} to topic {topic_domain_str}:\n   {result[topic]}")
    return result

`speech_to_features(self, *args, **kwargs)` ¶

Source code in adviser/services/hci/speech/SpeechInputFeatureExtractor.py

def delegate(self, *args, **kwargs):
    # Wrapper around `func` (a name from the enclosing scope, not shown here): calls it and,
    # when the bound method has a publish socket, sends the returned values out topic by topic.
    # Returns the result dict with any "/domain" suffix removed from its keys.
    func_inst = getattr(self, func.__name__)

    # `self` is passed explicitly below, so drop it if it also arrived through *args
    callargs = list(args)
    if self in callargs:
        callargs.remove(self)
    result = func(self, *callargs, **kwargs)

    if result:
        # Keys are "topic" or "topic/domain". Only the first two "/"-separated parts are
        # used, so anything after a second "/" is ignored (known limitation, marked "fix!"
        # in the original code).
        domains = {}
        bare_result = {}
        for key in result:
            parts = key.split("/")
            domains[parts[0]] = parts[1] if "/" in key else ""
            bare_result[parts[0]] = result[key]
        result = bare_result

    if func_inst not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[func_inst]
    domain = self._domain_name
    if not (socket and result):
        # nothing to publish with, or nothing to publish
        return result

    # Only the declared pub_topics are published; other keys in the result are not sent.
    for topic in pub_topics:
        if topic not in result:
            continue
        # the service domain wins; otherwise the first domain found in a result key is kept
        # for every following topic of this call
        domain = domain or domains[topic]
        if topic in self._pub_topic_domains:
            # an explicit per-topic setting overrides both of the above
            override = self._pub_topic_domains[topic]
            topic_domain_str = f"{topic}/{override}" if override else topic
        else:
            topic_domain_str = f"{topic}/{domain}" if domain else topic
        _send_msg(socket, topic_domain_str, result[topic])
        if self.debug_logger:
            self.debug_logger.info(
                f"- (DS): sent message from {func} to topic {topic_domain_str}:\n   {result[topic]}")
    return result

`speech_to_mfcc(self, *args, **kwargs)` ¶

Source code in adviser/services/hci/speech/SpeechInputFeatureExtractor.py

def delegate(self, *args, **kwargs):
    # Wrapper around `func` (a name from the enclosing scope, not shown here): calls it and,
    # when the bound method has a publish socket, sends the returned values out topic by topic.
    # Returns the result dict with any "/domain" suffix removed from its keys.
    func_inst = getattr(self, func.__name__)

    # `self` is passed explicitly below, so drop it if it also arrived through *args
    callargs = list(args)
    if self in callargs:
        callargs.remove(self)
    result = func(self, *callargs, **kwargs)

    if result:
        # Keys are "topic" or "topic/domain". Only the first two "/"-separated parts are
        # used, so anything after a second "/" is ignored (known limitation, marked "fix!"
        # in the original code).
        domains = {}
        bare_result = {}
        for key in result:
            parts = key.split("/")
            domains[parts[0]] = parts[1] if "/" in key else ""
            bare_result[parts[0]] = result[key]
        result = bare_result

    if func_inst not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[func_inst]
    domain = self._domain_name
    if not (socket and result):
        # nothing to publish with, or nothing to publish
        return result

    # Only the declared pub_topics are published; other keys in the result are not sent.
    for topic in pub_topics:
        if topic not in result:
            continue
        # the service domain wins; otherwise the first domain found in a result key is kept
        # for every following topic of this call
        domain = domain or domains[topic]
        if topic in self._pub_topic_domains:
            # an explicit per-topic setting overrides both of the above
            override = self._pub_topic_domains[topic]
            topic_domain_str = f"{topic}/{override}" if override else topic
        else:
            topic_domain_str = f"{topic}/{domain}" if domain else topic
        _send_msg(socket, topic_domain_str, result[topic])
        if self.debug_logger:
            self.debug_logger.info(
                f"- (DS): sent message from {func} to topic {topic_domain_str}:\n   {result[topic]}")
    return result

`SpeechOutputGenerator` ¶

`SpeechOutputGenerator (Service)` ¶

Source code in adviser/services/hci/speech/SpeechOutputGenerator.py

class SpeechOutputGenerator(Service):
    """
    Text-to-speech service: converts the text on topic `sys_utterance` into a waveform
    and publishes it on `system_speech`.
    """

    def __init__(self, domain: Domain = "", identifier: str = None, use_cuda=False, sub_topic_domains: Dict[str, str] = {}):
        """
        Text To Speech Module that reads out the system utterance.

        Loads the text-to-features model, the vocoder and the symbol dictionary from
        `<root>/resources/models/speech`.

        Args:
            domain (Domain): Needed for Service, no meaning here
            identifier (string): Needed for Service
            use_cuda (boolean): Whether or not to perform computations on GPU. Highly recommended if available
            sub_topic_domains: see `services.service.Service` constructor for more details
        """
        # NOTE(review): `sub_topic_domains` has a mutable default that is shared between calls;
        # it is only forwarded here, so this is safe as long as Service does not mutate it.
        Service.__init__(self, domain=domain, identifier=identifier, sub_topic_domains=sub_topic_domains)
        self.models_directory = os.path.join(get_root_dir(), "resources", "models", "speech")

        # The model names below are the only thing to change in order to use different models,
        # everything else should be dynamic.
        self.transcription_type = "phn"
        tts_name = "phn_train_no_dev_pytorch_train_fastspeech.v4"
        vocoder_name = "ljspeech.parallel_wavegan.v1"
        self.dict_path = os.path.join(
            self.models_directory, tts_name, "data", "lang_1phn", "train_no_dev_units.txt")
        self.model_path = os.path.join(
            self.models_directory, tts_name, "exp", tts_name, "results", "model.last1.avg.best")
        self.vocoder_path = os.path.join(
            self.models_directory, vocoder_name, "checkpoint-400000steps.pkl")
        self.vocoder_conf = os.path.join(self.models_directory, vocoder_name, "config.yml")

        # device to run the synthesis on
        self.device = torch.device("cuda" if use_cuda else "cpu")

        # end to end TTS model; its class is named in the stored training arguments
        self.input_dimensions, self.output_dimensions, self.train_args = get_model_conf(self.model_path)
        model_class = dynamic_import.dynamic_import(self.train_args.model_module)
        tts_model = model_class(self.input_dimensions, self.output_dimensions, self.train_args)
        torch_load(self.model_path, tts_model)
        self.model = tts_model.eval().to(self.device)
        self.inference_args = Namespace(threshold=0.5, minlenratio=0.0, maxlenratio=10.0)

        # neural vocoder
        # NOTE(review): yaml.Loader can construct arbitrary Python objects; acceptable only
        # while config.yml is a trusted local file.
        with open(self.vocoder_conf) as vocoder_config_file:
            self.config = yaml.load(vocoder_config_file, Loader=yaml.Loader)
        vocoder = ParallelWaveGANGenerator(**self.config["generator_params"])
        checkpoint = torch.load(self.vocoder_path, map_location="cpu")
        vocoder.load_state_dict(checkpoint["model"]["generator"])
        vocoder.remove_weight_norm()
        self.vocoder = vocoder.eval().to(self.device)

        # symbol dictionary: one "<symbol> <id>" pair per line
        with open(self.dict_path) as dictionary_file:
            raw_lines = dictionary_file.readlines()
        symbol_ids = {}
        for raw_line in raw_lines:
            symbol, index = raw_line.replace("\n", "").split(" ")
            symbol_ids[symbol] = int(index)
        self.char_to_id = symbol_ids
        self.g2p = G2p()

        # Fetch the pretrained Punkt tokenizer from NLTK (quietly). The original note says
        # the download only happens the first time the code runs on a machine.
        nltk.download('punkt', quiet=True)

    def preprocess_text_input(self, text):
        """
        Clean the text and then convert it to id sequence.

        Args:
            text (string): The text to preprocess

        Returns:
            A 1-D LongTensor of symbol ids on `self.device`; the last id is
            `self.input_dimensions - 1`, which marks the end of the sequence.
        """
        cleaned = custom_english_cleaners(text)
        # depending on the model type, different preprocessing is needed
        if self.transcription_type == "phn":
            phonemes = [token for token in self.g2p(cleaned) if token != " "]
            # join + split is kept on purpose: it reproduces the original tokenization exactly
            symbols = " ".join(phonemes).split(" ")
        else:
            symbols = list(cleaned)

        id_sequence = []
        for symbol in symbols:
            if symbol.isspace():
                key = "<space>"
            elif symbol not in self.char_to_id:
                key = "<unk>"
            else:
                key = symbol
            id_sequence.append(self.char_to_id[key])
        id_sequence.append(self.input_dimensions - 1)  # <eos>
        return torch.LongTensor(id_sequence).view(-1).to(self.device)

    @PublishSubscribe(sub_topics=["sys_utterance"], pub_topics=["system_speech"])
    def generate_speech(self, sys_utterance):
        """
        Takes the system utterance and turns it into a sound

        Args:
            sys_utterance (string): The new system utterance

        Returns:
            dict(string, tuple(np.array, int, string)): Everything needed to play the system utterance as an audio and the utterance in text for logging
        """
        with torch.no_grad():
            symbol_ids = self.preprocess_text_input(sys_utterance)
            acoustic_features, _, _ = self.model.inference(symbol_ids, self.inference_args)
            # one random value per output sample: number of feature frames times the hop size
            sample_count = acoustic_features.size(0) * self.config["hop_size"]
            random_input = torch.randn(1, 1, sample_count).to(self.device)
            context_window = self.config["generator_params"]["aux_context_window"]
            # add a leading dimension, swap the last two axes, then pad both ends by
            # replicating the edge values
            conditioning = acoustic_features.unsqueeze(0).transpose(2, 1)
            padded_conditioning = torch.nn.ReplicationPad1d(context_window)(conditioning)
            waveform = self.vocoder(random_input, padded_conditioning).view(-1)
            sound_as_array = waveform.cpu().numpy()
        return {"system_speech": (sound_as_array, self.config["sampling_rate"], sys_utterance)}

`__init__(self, domain='', identifier=None, use_cuda=False, sub_topic_domains={})` `special` ¶

Text To Speech Module that reads out the system utterance.

Parameters:

Name	Type	Description	Default
`domain`	`Domain`	Needed for Service, no meaning here	`''`
`identifier`	`string`	Needed for Service	`None`
`use_cuda`	`boolean`	Whether or not to perform computations on GPU. Highly recommended if available	`False`
`sub_topic_domains`	`Dict[str, str]`	see `services.service.Service` constructor for more details	`{}`

Source code in adviser/services/hci/speech/SpeechOutputGenerator.py

def __init__(self, domain: Domain = "", identifier: str = None, use_cuda=False, sub_topic_domains: Dict[str, str] = {}):
    """
    Set up the text-to-speech service: load the text-to-features model, the vocoder and
    the symbol dictionary from `<root>/resources/models/speech`.

    Args:
        domain (Domain): Needed for Service, no meaning here
        identifier (string): Needed for Service
        use_cuda (boolean): Whether or not to perform computations on GPU. Highly recommended if available
        sub_topic_domains: see `services.service.Service` constructor for more details
    """
    # NOTE(review): `sub_topic_domains` has a mutable default that is shared between calls;
    # it is only forwarded here, so this is safe as long as Service does not mutate it.
    Service.__init__(self, domain=domain, identifier=identifier, sub_topic_domains=sub_topic_domains)
    self.models_directory = os.path.join(get_root_dir(), "resources", "models", "speech")

    # The model names below are the only thing to change in order to use different models,
    # everything else should be dynamic.
    self.transcription_type = "phn"
    tts_name = "phn_train_no_dev_pytorch_train_fastspeech.v4"
    vocoder_name = "ljspeech.parallel_wavegan.v1"
    self.dict_path = os.path.join(
        self.models_directory, tts_name, "data", "lang_1phn", "train_no_dev_units.txt")
    self.model_path = os.path.join(
        self.models_directory, tts_name, "exp", tts_name, "results", "model.last1.avg.best")
    self.vocoder_path = os.path.join(
        self.models_directory, vocoder_name, "checkpoint-400000steps.pkl")
    self.vocoder_conf = os.path.join(self.models_directory, vocoder_name, "config.yml")

    # device to run the synthesis on
    self.device = torch.device("cuda" if use_cuda else "cpu")

    # end to end TTS model; its class is named in the stored training arguments
    self.input_dimensions, self.output_dimensions, self.train_args = get_model_conf(self.model_path)
    model_class = dynamic_import.dynamic_import(self.train_args.model_module)
    tts_model = model_class(self.input_dimensions, self.output_dimensions, self.train_args)
    torch_load(self.model_path, tts_model)
    self.model = tts_model.eval().to(self.device)
    self.inference_args = Namespace(threshold=0.5, minlenratio=0.0, maxlenratio=10.0)

    # neural vocoder
    # NOTE(review): yaml.Loader can construct arbitrary Python objects; acceptable only
    # while config.yml is a trusted local file.
    with open(self.vocoder_conf) as vocoder_config_file:
        self.config = yaml.load(vocoder_config_file, Loader=yaml.Loader)
    vocoder = ParallelWaveGANGenerator(**self.config["generator_params"])
    checkpoint = torch.load(self.vocoder_path, map_location="cpu")
    vocoder.load_state_dict(checkpoint["model"]["generator"])
    vocoder.remove_weight_norm()
    self.vocoder = vocoder.eval().to(self.device)

    # symbol dictionary: one "<symbol> <id>" pair per line
    with open(self.dict_path) as dictionary_file:
        raw_lines = dictionary_file.readlines()
    symbol_ids = {}
    for raw_line in raw_lines:
        symbol, index = raw_line.replace("\n", "").split(" ")
        symbol_ids[symbol] = int(index)
    self.char_to_id = symbol_ids
    self.g2p = G2p()

    # Fetch the pretrained Punkt tokenizer from NLTK (quietly). The original note says
    # the download only happens the first time the code runs on a machine.
    nltk.download('punkt', quiet=True)

`generate_speech(self, *args, **kwargs)` ¶

Source code in adviser/services/hci/speech/SpeechOutputGenerator.py

def delegate(self, *args, **kwargs):
    # Wrapper around `func` (a name from the enclosing scope, not shown here): calls it and,
    # when the bound method has a publish socket, sends the returned values out topic by topic.
    # Returns the result dict with any "/domain" suffix removed from its keys.
    func_inst = getattr(self, func.__name__)

    # `self` is passed explicitly below, so drop it if it also arrived through *args
    callargs = list(args)
    if self in callargs:
        callargs.remove(self)
    result = func(self, *callargs, **kwargs)

    if result:
        # Keys are "topic" or "topic/domain". Only the first two "/"-separated parts are
        # used, so anything after a second "/" is ignored (known limitation, marked "fix!"
        # in the original code).
        domains = {}
        bare_result = {}
        for key in result:
            parts = key.split("/")
            domains[parts[0]] = parts[1] if "/" in key else ""
            bare_result[parts[0]] = result[key]
        result = bare_result

    if func_inst not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[func_inst]
    domain = self._domain_name
    if not (socket and result):
        # nothing to publish with, or nothing to publish
        return result

    # Only the declared pub_topics are published; other keys in the result are not sent.
    for topic in pub_topics:
        if topic not in result:
            continue
        # the service domain wins; otherwise the first domain found in a result key is kept
        # for every following topic of this call
        domain = domain or domains[topic]
        if topic in self._pub_topic_domains:
            # an explicit per-topic setting overrides both of the above
            override = self._pub_topic_domains[topic]
            topic_domain_str = f"{topic}/{override}" if override else topic
        else:
            topic_domain_str = f"{topic}/{domain}" if domain else topic
        _send_msg(socket, topic_domain_str, result[topic])
        if self.debug_logger:
            self.debug_logger.info(
                f"- (DS): sent message from {func} to topic {topic_domain_str}:\n   {result[topic]}")
    return result

`preprocess_text_input(self, text)` ¶

Clean the text and then convert it to id sequence.

Parameters:

Name	Type	Description	Default
`text`	`string`	The text to preprocess	required

Source code in adviser/services/hci/speech/SpeechOutputGenerator.py

def preprocess_text_input(self, text):
    """
    Clean the text and then convert it to id sequence.

    Args:
        text (string): The text to preprocess

    Returns:
        A 1-D LongTensor of symbol ids on `self.device`; the last id is
        `self.input_dimensions - 1`, which marks the end of the sequence.
    """
    cleaned = custom_english_cleaners(text)
    # depending on the model type, different preprocessing is needed
    if self.transcription_type == "phn":
        phonemes = [token for token in self.g2p(cleaned) if token != " "]
        # join + split is kept on purpose: it reproduces the original tokenization exactly
        symbols = " ".join(phonemes).split(" ")
    else:
        symbols = list(cleaned)

    id_sequence = []
    for symbol in symbols:
        if symbol.isspace():
            key = "<space>"
        elif symbol not in self.char_to_id:
            key = "<unk>"
        else:
            key = symbol
        id_sequence.append(self.char_to_id[key])
    id_sequence.append(self.input_dimensions - 1)  # <eos>
    return torch.LongTensor(id_sequence).view(-1).to(self.device)

`get_root_dir()` ¶

Source code in adviser/services/hci/speech/SpeechOutputGenerator.py

def get_root_dir():
    """Return the directory four levels above this file's directory entry (absolute path)."""
    path = os.path.abspath(__file__)
    # strip the file name and then three parent directories
    for _ in range(4):
        path = os.path.dirname(path)
    return path

`SpeechOutputPlayer` ¶

`SpeechOutputPlayer (Service)` ¶

Source code in adviser/services/hci/speech/SpeechOutputPlayer.py

class SpeechOutputPlayer(Service):
    """Service that plays the audio received on topic `system_speech` and optionally logs it."""

    def __init__(self, domain: Domain = "", conversation_log_dir: str = None, identifier: str = None):
        """
        Service that plays the system utterance as sound

        Args:
            domain (Domain): Needed for Service, but has no meaning here
            conversation_log_dir (string): If this is provided it will create log files in the specified directory.
            identifier (string): Needed for Service.
        """
        Service.__init__(self, domain=domain, identifier=identifier)
        self.conversation_log_dir = conversation_log_dir
        self.interaction_count = 0

    @PublishSubscribe(sub_topics=["system_speech"], pub_topics=[])
    def speak(self, system_speech):
        """
        Takes the system utterance and reads it out. Also can log the audio and text.

        Args:
            system_speech: Indexable with the audio array at position 0, the sampling rate at
                position 1 and the utterance text at position 2 (the text is only read when
                logging). The result of the systems TTS synthesis service.
        """
        audio, sampling_rate = system_speech[0], system_speech[1]
        sounddevice.play(audio, sampling_rate)

        if self.conversation_log_dir is None:
            # logging is disabled
            return

        # log the utterance: audio and text share a file stem built from the current unix time
        log_stem = os.path.join(self.conversation_log_dir, str(math.floor(time.time())))
        sf.write(log_stem + "_system.wav", audio, sampling_rate, 'PCM_24')
        with open(log_stem + "_system.txt", "w") as convo_log:
            convo_log.write(system_speech[2])

`__init__(self, domain='', conversation_log_dir=None, identifier=None)` `special` ¶

Service that plays the system utterance as sound

Parameters:

Name	Type	Description	Default
`domain`	`Domain`	Needed for Service, but has no meaning here	`''`
`conversation_log_dir`	`string`	If this is provided it will create log files in the specified directory.	`None`
`identifier`	`string`	Needed for Service.	`None`

Source code in adviser/services/hci/speech/SpeechOutputPlayer.py

def __init__(self, domain: Domain = "", conversation_log_dir: str = None, identifier: str = None):
    """
    Sets up the service that plays the system utterance as sound.

    Args:
        domain (Domain): Forwarded to Service; this class does not use it itself
        conversation_log_dir (string): Directory for the audio and text logs. Nothing is logged if this is None.
        identifier (string): Forwarded to Service.
    """
    Service.__init__(self, domain=domain, identifier=identifier)
    self.interaction_count = 0
    self.conversation_log_dir = conversation_log_dir

`speak(self, *args, **kwargs)` ¶

Source code in adviser/services/hci/speech/SpeechOutputPlayer.py

def delegate(self, *args, **kwargs):
    """
    Runs the wrapped function and publishes its result on the function's publish socket.

    `func`, `pub_topics` and `_send_msg` are not defined in this function; they are
    taken from the enclosing scope.

    Args:
        *args: positional arguments for the wrapped function; `self` is dropped from
               them if present, because it is passed explicitly
        **kwargs: keyword arguments, forwarded unchanged

    Returns:
        The wrapped function's result. A truthy result is re-keyed so that every key
        is reduced to the part in front of its first "/".
    """
    func_inst = getattr(self, func.__name__)

    # Drop self by identity. `self in callargs` and `callargs.remove(self)` compare
    # with ==, which raises for arguments whose == is element-wise (e.g. numpy arrays).
    callargs = [arg for arg in args if arg is not self]
    result = func(self, *callargs, **kwargs)
    if result:
        # TODO: keys with more than one "/" are split at the first "/" and everything
        # behind the second "/" is dropped
        domains = {res.split("/")[0]: res.split("/")[1] if "/" in res else "" for res in result}
        result = {key.split("/")[0]: result[key] for key in result}

    if func_inst not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[func_inst]
    service_domain = self._domain_name
    if socket and result:
        # publish messages
        # NOTE: only topics listed in pub_topics are published, not every key of result
        for topic in pub_topics:
            if topic in result:
                # Resolve the domain for this topic only. Reusing one variable across
                # iterations would let the first topic's domain leak into later topics.
                topic_domain = service_domain if service_domain else domains[topic]
                topic_domain_str = f"{topic}/{topic_domain}" if topic_domain else topic
                if topic in self._pub_topic_domains:
                    # an explicit per-topic domain overrides both other sources
                    topic_domain_str = f"{topic}/{self._pub_topic_domains[topic]}" if self._pub_topic_domains[topic] else topic
                _send_msg(socket, topic_domain_str, result[topic])
                if self.debug_logger:
                    self.debug_logger.info(
                        f"- (DS): sent message from {func} to topic {topic_domain_str}:\n   {result[topic]}")
    return result

`SpeechRecorder` ¶

`SpeechRecorder (Service)` ¶

Source code in adviser/services/hci/speech/SpeechRecorder.py

class SpeechRecorder(Service):
    """Push-to-talk microphone recorder that publishes each recorded utterance on "speech_in"."""

    def __init__(self, domain: Union[str, Domain] = "", conversation_log_dir: str = None, enable_plotting: bool = False, threshold: int = 8000,
                 voice_privacy: bool = False, identifier: str = None) -> None:
        """
        A service that can record a microphone upon a key pressing event
        and publish the result as an array. The end of the utterance is
        detected automatically, also the voice can be masked to alleviate
        privacy issues.

        Args:
            domain (Domain): Forwarded to Service; the recorder does not use it itself
            conversation_log_dir (string): If this parameter is given, log files of the conversation will be created in this directory
            enable_plotting (boolean): If this is set to True, the recorder is no longer real time able and thus the recordings don't work properly. This is just to be used to tune the threshold for the end of utterance detection, not during deployment.
            threshold (int): A chunk counts as speech if its largest sample exceeds this value, otherwise it counts as silence
            voice_privacy (boolean): Whether or not to enable the masking of the users voice
            identifier (string): Forwarded to Service
        """
        Service.__init__(self, domain=domain, identifier=identifier)
        self.conversation_log_dir = conversation_log_dir
        self.recording_indicator = False  # True while record_user_utterance is running
        self.audio_interface = pyaudio.PyAudio()
        self.push_to_talk_listener = keyboard.Listener(on_press=self.start_recording)
        self.threshold = threshold
        self.enable_plotting = enable_plotting
        self.voice_privacy = voice_privacy

    @PublishSubscribe(pub_topics=["speech_in"])
    def record_user_utterance(self):
        """
        Records audio once a button is pressed and stops if there is enough continuous silence.
        The numpy array consisting of the frames will be published once it's done.

        The stream is closed and the recording flag is reset even if recording fails,
        so a failed recording does not block later ones.

        Returns:
            dict(string, tuple(np.array, int)): The utterance in form of an array and the sampling rate of the utterance
        """
        chunk = 1024  # how many frames per chunk
        audio_format = pyaudio.paInt16  # 16 bit integer based audio for quick processing
        channels = 1  # our asr model only accepts mono sounds
        sampling_rate = 16000  # only 16000 Hz works for the asr model we're using
        # setup for naive end of utterance detection
        continuous_seconds_of_silence_before_utterance_ends = 3.0  # this may be changed freely
        silence_chunks_to_stop = int(
            (continuous_seconds_of_silence_before_utterance_ends * sampling_rate) / chunk)
        maximum_utterance_time_in_chunks = int((20 * sampling_rate) / chunk)  # 20 seconds

        recorded_chunks = []  # raw binary data of every chunk read so far
        self.recording_indicator = True
        try:
            stream = self.audio_interface.open(format=audio_format,
                                               channels=channels,
                                               rate=sampling_rate,
                                               input=True,
                                               frames_per_buffer=chunk)
            try:
                if self.enable_plotting:
                    threshold_plotter = self.threshold_plotter_generator()
                remaining_silence_chunks = silence_chunks_to_stop
                print("\nrecording...")
                for _ in range(maximum_utterance_time_in_chunks):
                    raw_data = stream.read(chunk)
                    recorded_chunks.append(raw_data)
                    # interpret the bytes as 16 bit samples, matching audio_format
                    wave_data = np.frombuffer(raw_data, dtype=np.int16)
                    if self.enable_plotting:
                        threshold_plotter(wave_data)
                    # NOTE(review): only the positive peak is compared, negative peaks are ignored
                    if np.max(wave_data) > self.threshold:
                        # speech detected, the silence countdown starts over
                        remaining_silence_chunks = silence_chunks_to_stop
                    else:
                        remaining_silence_chunks -= 1
                        if remaining_silence_chunks == 0:
                            break
                print("...done recording.\n")
            finally:
                stream.stop_stream()
                stream.close()
                if self.enable_plotting:
                    plt.close()

            recording = b''.join(recorded_chunks)
            if self.conversation_log_dir is not None:
                # int() instead of np.math.floor: the np.math alias no longer exists in NumPy 2.0
                log_path = os.path.join(self.conversation_log_dir, str(int(time.time())) + "_user.wav")
                with wave.open(log_path, 'wb') as audio_file:
                    audio_file.setnchannels(channels)
                    audio_file.setsampwidth(self.audio_interface.get_sample_size(audio_format))
                    audio_file.setframerate(sampling_rate)
                    audio_file.writeframes(recording)
        finally:
            self.recording_indicator = False

        audio_sequence = np.frombuffer(recording, dtype=np.int16).astype(np.float32)
        if self.voice_privacy:
            audio_sequence = voice_sanitizer(audio_sequence)
        return {"speech_in": (audio_sequence, sampling_rate)}

    def start_recording(self, key):
        """
        This method is a callback of the push to talk key
        listener. It calls the recorder, if it's not already recording.

        Args:
            key (Key): The pressed key
        """
        if (key is keyboard.Key.cmd_r or key is keyboard.Key.ctrl_r) and not self.recording_indicator:
            self.record_user_utterance()

    def start_recorder(self):
        """
        Starts the listener and outputs that the speech recorder is ready for use
        """
        self.push_to_talk_listener.start()
        print("To speak to the system, tap your right [CTRL] or [CMD] key.\n"
              "It will try to automatically detect when your utterance is over.\n")

    def threshold_plotter_generator(self):
        """
        Generates a plotter to visualize when the signal is above the set threshold

        Returns:
            function: Plots the threshold with the current continuous waveform
        """
        import matplotlib
        matplotlib.use('TkAgg')
        plt.figure(figsize=(10, 2))
        plt.axhline(y=self.threshold, xmin=0.0, xmax=1.0, color='r')
        plt.axhline(y=-self.threshold, xmin=0.0, xmax=1.0, color='r')
        plt.pause(0.000000000001)

        def threshold_plotter(data):
            # redraw from scratch: the waveform of the chunk plus both threshold lines
            plt.clf()
            plt.tight_layout()
            plt.axis([0, len(data), -20000, 20000])
            plt.plot(data, color='b')
            plt.axhline(y=self.threshold, xmin=0.0, xmax=1.0, color='r')
            plt.axhline(y=-self.threshold, xmin=0.0, xmax=1.0, color='r')
            plt.pause(0.000000000001)

        return threshold_plotter

`__init__(self, domain='', conversation_log_dir=None, enable_plotting=False, threshold=8000, voice_privacy=False, identifier=None)` `special` ¶

A service that can record a microphone upon a key pressing event and publish the result as an array. The end of the utterance is detected automatically, also the voice can be masked to alleviate privacy issues.

Parameters:

Name	Type	Description	Default
`domain`	`Domain`	I don't know why this is here. Service needs it, but it means nothing in this context.	`''`
`conversation_log_dir`	`string`	If this parameter is given, log files of the conversation will be created in this directory	`None`
`enable_plotting`	`boolean`	If this is set to True, the recorder is no longer real time able and thus the recordings don't work properly. This is just to be used to tune the threshold for the end of utterance detection, not during deployment.	`False`
`threshold`	`int`	The threshold below which the assumption of the end of utterance detection is silence	`8000`
`voice_privacy`	`boolean`	Whether or not to enable the masking of the users voice	`False`
`identifier`	`string`	I don't know why this is here. Service needs it.	`None`

Source code in adviser/services/hci/speech/SpeechRecorder.py

def __init__(self, domain: Union[str, Domain] = "", conversation_log_dir: str = None, enable_plotting: bool = False, threshold: int = 8000,
             voice_privacy: bool = False, identifier: str = None) -> None:
    """
    Sets up a recorder that captures the microphone after a key press and
    publishes the recording as an array. The end of the utterance is found
    automatically, and the voice can optionally be masked for privacy.

    Args:
        domain (Domain): Forwarded to Service; the recorder does not use it itself
        conversation_log_dir (string): If given, log files of the conversation are created in this directory
        enable_plotting (boolean): Only meant for tuning the end of utterance threshold. With plotting enabled the recorder is no longer real time able, so recordings don't work properly; do not use it during deployment.
        threshold (int): The threshold that separates speech from silence in the end of utterance detection
        voice_privacy (boolean): Whether or not the user's voice is masked
        identifier (string): Forwarded to Service
    """
    Service.__init__(self, domain=domain, identifier=identifier)
    # plain configuration values
    self.conversation_log_dir = conversation_log_dir
    self.threshold = threshold
    self.enable_plotting = enable_plotting
    self.voice_privacy = voice_privacy
    # recording state and devices
    self.recording_indicator = False
    self.audio_interface = pyaudio.PyAudio()
    self.push_to_talk_listener = keyboard.Listener(on_press=self.start_recording)

`record_user_utterance(self, *args, **kwargs)` ¶

Source code in adviser/services/hci/speech/SpeechRecorder.py

def delegate(self, *args, **kwargs):
    """
    Runs the wrapped function and publishes its result on the function's publish socket.

    `func`, `pub_topics` and `_send_msg` are not defined in this function; they are
    taken from the enclosing scope.

    Args:
        *args: positional arguments for the wrapped function; `self` is dropped from
               them if present, because it is passed explicitly
        **kwargs: keyword arguments, forwarded unchanged

    Returns:
        The wrapped function's result. A truthy result is re-keyed so that every key
        is reduced to the part in front of its first "/".
    """
    func_inst = getattr(self, func.__name__)

    # Drop self by identity. `self in callargs` and `callargs.remove(self)` compare
    # with ==, which raises for arguments whose == is element-wise (e.g. numpy arrays).
    callargs = [arg for arg in args if arg is not self]
    result = func(self, *callargs, **kwargs)
    if result:
        # TODO: keys with more than one "/" are split at the first "/" and everything
        # behind the second "/" is dropped
        domains = {res.split("/")[0]: res.split("/")[1] if "/" in res else "" for res in result}
        result = {key.split("/")[0]: result[key] for key in result}

    if func_inst not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[func_inst]
    service_domain = self._domain_name
    if socket and result:
        # publish messages
        # NOTE: only topics listed in pub_topics are published, not every key of result
        for topic in pub_topics:
            if topic in result:
                # Resolve the domain for this topic only. Reusing one variable across
                # iterations would let the first topic's domain leak into later topics.
                topic_domain = service_domain if service_domain else domains[topic]
                topic_domain_str = f"{topic}/{topic_domain}" if topic_domain else topic
                if topic in self._pub_topic_domains:
                    # an explicit per-topic domain overrides both other sources
                    topic_domain_str = f"{topic}/{self._pub_topic_domains[topic]}" if self._pub_topic_domains[topic] else topic
                _send_msg(socket, topic_domain_str, result[topic])
                if self.debug_logger:
                    self.debug_logger.info(
                        f"- (DS): sent message from {func} to topic {topic_domain_str}:\n   {result[topic]}")
    return result

`start_recorder(self)` ¶

Starts the listener and outputs that the speech recorder is ready for use

Source code in adviser/services/hci/speech/SpeechRecorder.py

def start_recorder(self):
    """
    Launches the push to talk key listener and tells the user how to use the recorder
    """
    usage_hint = ("To speak to the system, tap your right [CTRL] or [CMD] key.\n"
                  "It will try to automatically detect when your utterance is over.\n")
    self.push_to_talk_listener.start()
    print(usage_hint)

`start_recording(self, key)` ¶

This method is a callback of the push to talk key listener. It calls the recorder, if it's not already recording.

Parameters:

Name	Type	Description	Default
`key`	`Key`	The pressed key	required

Source code in adviser/services/hci/speech/SpeechRecorder.py

def start_recording(self, key):
    """
    Callback of the push to talk key listener. Starts a recording when the
    right [CMD] or right [CTRL] key was pressed and no recording is running.

    Args:
        key (Key): The pressed key
    """
    is_push_to_talk_key = key is keyboard.Key.cmd_r or key is keyboard.Key.ctrl_r
    if not is_push_to_talk_key:
        return
    if self.recording_indicator:
        # a recording is already in progress
        return
    self.record_user_utterance()

`threshold_plotter_generator(self)` ¶

Generates a plotter to visualize when the signal is above the set threshold

Returns:

Type	Description
`function`	Plots the threshold with the current continuous waveform

Source code in adviser/services/hci/speech/SpeechRecorder.py

def threshold_plotter_generator(self):
    """
    Opens a figure showing the threshold and builds the function that redraws it per chunk

    Returns:
        function: Plots the threshold with the current continuous waveform
    """
    import matplotlib
    matplotlib.use('TkAgg')

    def _draw_threshold_and_refresh():
        # red lines at +threshold and -threshold, then a minimal pause so the figure updates
        for level in (self.threshold, -self.threshold):
            plt.axhline(y=level, xmin=0.0, xmax=1.0, color='r')
        plt.pause(0.000000000001)

    plt.figure(figsize=(10, 2))
    _draw_threshold_and_refresh()

    def threshold_plotter(data):
        # start from an empty figure and draw the waveform of the given chunk
        plt.clf()
        plt.tight_layout()
        plt.axis([0, len(data), -20000, 20000])
        plt.plot(data, color='b')
        _draw_threshold_and_refresh()

    return threshold_plotter

`voice_sanitizer(audio)` ¶

While this is by no means a good voice sanitizer, it works as a proof of concept. It randomly shifts the spectrogram of a speakers utterance up or down, making automatic speaker identification much harder while keeping impact on asr performance as low as possible. The use should be turned off by default.

Parameters:

Name	Type	Description	Default
`audio`	`np.array`	The audio represented as array	required

Returns:

Type	Description
`np.array`	The mutated audio as array

Source code in adviser/services/hci/speech/SpeechRecorder.py

def voice_sanitizer(audio):
    """
    While this is by no means a good voice sanitizer,
    it works as a proof of concept. It randomly shifts
    the spectrogram of a speakers utterance up or down,
    making automatic speaker identification much harder
    while keeping impact on asr performance as low as
    possible. The use should be turned off by default.

    The shift is 3, 4 or 5 frequency bins. The bins that have no
    source bin inside the spectrogram (the lowest ones when shifting
    up, the highest ones when shifting down) keep their original content.

    Args:
        audio (np.array): The audio represented as array

    Returns:
        np.array: The mutated audio as array
    """
    spectrogram = librosa.stft(audio)
    voice_shift = np.random.randint(3, 6)
    if np.random.choice([True, False]):
        # Mutate the voice to be higher. Slices are used instead of a per-row loop,
        # because with a loop the negative source indices of the lowest rows wrap
        # around to the end of the array instead of raising an IndexError.
        spectrogram[voice_shift:] = spectrogram[:-voice_shift].copy()
    else:
        # mutate the voice to be lower
        spectrogram[:-voice_shift] = spectrogram[voice_shift:].copy()

    return librosa.istft(spectrogram)

`cleaners` ¶

This file is derived from https://github.com/keithito/tacotron.

`basic_cleaners(text)` ¶

Basic pipeline that lowercases and collapses whitespace without transliteration.

Source code in adviser/services/hci/speech/cleaners.py

def basic_cleaners(text):
    """Lowercases the text and then collapses its whitespace; no transliteration is applied."""
    return collapse_whitespace(lowercase(text))

`collapse_whitespace(text)` ¶

Source code in adviser/services/hci/speech/cleaners.py

def collapse_whitespace(text):
    """Replaces every match of the module's whitespace pattern with a single space."""
    collapsed = re.sub(pattern=_whitespace_re, repl=' ', string=text)
    return collapsed

`convert_to_ascii(text)` ¶

Source code in adviser/services/hci/speech/cleaners.py

def convert_to_ascii(text):
    """Returns the text after passing it through unidecode."""
    ascii_text = unidecode(text)
    return ascii_text

`custom_english_cleaners(text)` ¶

Custom pipeline for English text, including number and abbreviation expansion.

Source code in adviser/services/hci/speech/cleaners.py

def custom_english_cleaners(text):
    """
    Custom pipeline for English text, including number and abbreviation expansion.

    The steps run in the listed order; the result is upper case.
    """
    pipeline = (
        convert_to_ascii,
        expand_email,
        expand_acronym,
        lowercase,
        expand_numbers,
        expand_abbreviations,
        expand_symbols,
        remove_unnecessary_symbols,
        uppercase,
        collapse_whitespace,
    )
    for step in pipeline:
        text = step(text)
    return text

`english_cleaners(text)` ¶

Pipeline for English text, including number and abbreviation expansion.

Source code in adviser/services/hci/speech/cleaners.py

def english_cleaners(text):
    """
    Pipeline for English text, including number and abbreviation expansion.

    The steps run in the listed order.
    """
    pipeline = (
        convert_to_ascii,
        lowercase,
        expand_numbers,
        expand_abbreviations,
        collapse_whitespace,
    )
    for step in pipeline:
        text = step(text)
    return text

`expand_abbreviations(text)` ¶

Preprocesses a text to turn abbreviations into forms that the TTS can pronounce properly

text (string): Text to be preprocessed

Source code in adviser/services/hci/speech/cleaners.py

def expand_abbreviations(text):
    """
    Rewrites abbreviations into forms that the TTS can pronounce properly

    Every (pattern, replacement) pair of the module's abbreviation table is
    applied to the text one after another.

    text (string): Text to be preprocessed
    """
    expanded = text
    for pattern, spoken_form in _abbreviations:
        expanded = re.sub(pattern, spoken_form, expanded)
    return expanded

`expand_acronym(text)` ¶

Preprocesses a text to turn acronyms into forms that the TTS can pronounce properly

text (string): Text to be preprocessed

Source code in adviser/services/hci/speech/cleaners.py

def expand_acronym(text):
    """
    Rewrites acronyms into forms that the TTS can pronounce properly

    Every (pattern, replacement) pair of the module's acronym table is
    applied to the text one after another.

    text (string): Text to be preprocessed
    """
    expanded = text
    for pattern, spoken_form in _acronym:
        expanded = re.sub(pattern, spoken_form, expanded)
    return expanded

`expand_email(text)` ¶

Source code in adviser/services/hci/speech/cleaners.py

def expand_email(text):
    """Replaces every match of the module's email pattern with the output of _expand_email."""
    return re.sub(_email_re, _expand_email, text)

`expand_numbers(text)` ¶

Source code in adviser/services/hci/speech/cleaners.py

def expand_numbers(text):
    """Returns the text with its numbers normalized by normalize_numbers."""
    normalized = normalize_numbers(text)
    return normalized

`expand_symbols(text)` ¶

Source code in adviser/services/hci/speech/cleaners.py

def expand_symbols(text):
    """
    Replaces symbols with text the TTS can handle: ";" and ":" become ",",
    "-" becomes a space and "&" becomes "and".
    """
    # added
    substitutions = (
        (";", ","),
        (":", ","),
        ("-", " "),
        ("&", "and"),
    )
    for symbol, spoken_form in substitutions:
        text = re.sub(symbol, spoken_form, text)
    return text

`lowercase(text)` ¶

Source code in adviser/services/hci/speech/cleaners.py

def lowercase(text):
    """Returns the lower case version of the text."""
    lowered = text.lower()
    return lowered

`normalize_numbers(text)` ¶

Normalizes numbers in an utterance as preparation for TTS

text (string): Text to be preprocessed

Source code in adviser/services/hci/speech/cleaners.py

def normalize_numbers(text):
    """
    Normalizes numbers in an utterance as preparation for TTS

    The substitutions are applied in the listed order, each one on the
    output of the previous one.

    text (string): Text to be preprocessed
    """
    substitutions = (
        (_comma_number_re, _remove_commas),
        (_pounds_re, r'\1 pounds'),
        (_dollars_re, _expand_dollars),
        (_decimal_number_re, _expand_decimal_point),
        (_ordinal_re, _expand_ordinal),
        (_ID_number_re, _expand_ID_number),
        (_number_re, _expand_number),
    )
    for pattern, replacement in substitutions:
        text = re.sub(pattern, replacement, text)
    return text

`remove_unnecessary_symbols(text)` ¶

Source code in adviser/services/hci/speech/cleaners.py

def remove_unnecessary_symbols(text):
    """
    Removes brackets, angle brackets and double quotes and turns slashes into spaces

    text (string): Text to be preprocessed
    """
    # added
    # "[" and "]" have to be escaped inside the character class; unescaped, the class
    # ends at the first "]" and the pattern no longer matches the individual symbols
    text = re.sub(r'[()\[\]<>"]+', '', text)
    text = re.sub(r'/', ' ', text)
    return text

`transliteration_cleaners(text)` ¶

Pipeline for non-English text that transliterates to ASCII.

Source code in adviser/services/hci/speech/cleaners.py

def transliteration_cleaners(text):
    """
    Pipeline for non-English text that transliterates to ASCII.

    After the transliteration the text is lowercased and its whitespace is collapsed.
    """
    ascii_text = convert_to_ascii(text)
    return collapse_whitespace(lowercase(ascii_text))

`uppercase(text)` ¶

Source code in adviser/services/hci/speech/cleaners.py

def uppercase(text):
    """Returns the upper case version of the text."""
    # added
    upper_text = text.upper()
    return upper_text

`speech_utility` ¶

Utility for the emotion recognition script that needs the utterance as a file

`delete_file(filepath)` ¶

Deletes the file at the given path to clean up the audio file once it's not needed anymore. This is why unique filenames are important.

filepath (string): path to the file that is to be deleted

Source code in adviser/services/hci/speech/speech_utility.py

def delete_file(filepath):
    """
    Deletes the file at the given path to clean up the audio file
    once it's not needed anymore. This is why unique filenames are
    important.

    If there is no file at the path, a hint is printed and nothing is raised.

    filepath (string): path to the file that is to be deleted
    """
    # Try the removal directly instead of checking for existence first: between a
    # check and the removal the file could vanish, which would raise unhandled.
    try:
        os.remove(filepath)
    except (FileNotFoundError, NotADirectoryError):
        print("The file cannot be deleted, as it was not found. "
              "Please check the provided path for errors: \n{}".format(filepath))

`sound_array_to_file(filepath, sampling_rate, sound_as_array)` ¶

Saves the recording of the recorder to a file

Turns the audio from the recorder service into a wav file for processing with opensmile c++ scripts

filepath (string): full path, including filename and .wav suffix, at an arbitrary location. Careful: Python takes paths as relative to the main script. The name should be unique, to ensure files don't get mixed up if there are multiple calls in a short time and one file might get overwritten or deleted before it's done being processed. sampling_rate (int): the sampling rate of the audio, as published by the recorder. sound_as_array (np.array): the audio in form of an array, as published by the recorder.

Source code in adviser/services/hci/speech/speech_utility.py

def sound_array_to_file(filepath, sampling_rate, sound_as_array):
    """
    Saves the recording of the recorder to a file

    Turns the audio from the recorder service into a wav file for
    processing with opensmile c++ scripts

    filepath (string): full path, including filename and .wav suffix
    at an arbitrary location. Careful: python takes paths as
    relative to the main script. The name should be unique, to
    ensure files don't get mixed up if there are multiple calls
    in short time and one file might get overwritten or deleted
    before it's done being processed.
    sampling_rate (int): the sampling rate of the audio, as
    published by the recorder
    sound_as_array (np.array): the audio in form of an array as
    published by the recorder
    """
    # librosa.output.write_wav does not exist in librosa 0.8 and later, so the file
    # is written with scipy instead. Imported here to keep the change local.
    from scipy.io import wavfile

    samples = sound_as_array
    # scipy expects (samples, channels); an array with two rows is taken to be
    # channel-first stereo and transposed (the recorder itself publishes mono audio)
    if samples.ndim > 1 and samples.shape[0] == 2:
        samples = samples.T
    wavfile.write(filepath, sampling_rate, samples)

`video` `special` ¶

`FeatureExtractor` ¶

Feature extraction with openSMILE

`VideoFeatureExtractor (Service)` ¶

TODO

Source code in adviser/services/hci/video/FeatureExtractor.py

class VideoFeatureExtractor(Service):
    """Service that turns a list of video frames into aggregated facial landmark features."""

    def __init__(self, domain: Domain = ""):
        """
        Creates the contrast equalizer, the face detector and the landmark predictor.

        Args:
            domain (Domain): Forwarded to Service
        """
        Service.__init__(self, domain=domain)
        self.module_dir = os.path.dirname(os.path.abspath(__file__))
        # CLAHE (Contrast Limited Adaptive Histogram Equalization)
        self.CLAHE = cv2.createCLAHE(clipLimit=2.0, tileGridSize=(8, 8))
        # for detecting faces (returns coordinates of rectangle(s) of face area(s))
        self.DETECTOR = dlib.get_frontal_face_detector()
        # facial landmark predictor, the model file is located relative to this module
        model_path = os.path.join(self.module_dir, '..', '..', '..', 'resources', 'models', 'video', 'shape_predictor_68_face_landmarks.dat')
        predictor_file = os.path.abspath(model_path)
        self.PREDICTOR = dlib.shape_predictor(predictor_file)

    @PublishSubscribe(queued_sub_topics=["video_input"], sub_topics=["user_acts"],
                      pub_topics=["fl_features"])
    def extract_fl_features(self, video_input, user_acts):
        """
        Computes six landmark based values for every second frame in which a face is
        found (using the first detected face) and aggregates them over all those frames.

        Args:
            video_input: the frames to process; each one is converted from RGB to grayscale
            user_acts: not used by this method

        Returns:
            dict: key 'fl_features' holds an array of shape (1, 36) with mean, minimum,
                  maximum, standard deviation, 25th and 75th percentile of the six values,
                  or None if no face was found in any processed frame
        """
        def _distance(a, b):
            return np.linalg.norm(a-b)

        def _normalized_sum(points, anchor, indices, norm):
            # sum of the distances from the anchor landmark to each listed landmark, divided by norm
            return sum(_distance(points[anchor], points[i]) / norm for i in indices)

        print(f'VIDEO FEATURE ENTER, len(video_input): {len(video_input)}')
        per_frame_features = []
        for frame in video_input[::2]:
            gray = cv2.cvtColor(frame, cv2.COLOR_RGB2GRAY)
            gray = self.CLAHE.apply(gray)
            faces = self.DETECTOR(gray, 1)
            if len(faces) == 0:
                # no face in this frame
                continue

            points = face_utils.shape_to_np(self.PREDICTOR(gray, faces[0]))
            # reference distances used for normalization
            norm_left_eye = _distance(points[21], points[39])
            norm_right_eye = _distance(points[22], points[42])
            norm_lips = _distance(points[33], points[52])

            per_frame_features.append(np.array([
                _normalized_sum(points, 39, [18, 19, 20, 21], norm_left_eye),   # eyebrow_left
                _normalized_sum(points, 42, [22, 23, 24, 25], norm_right_eye),  # eyebrow_right
                _normalized_sum(points, 33, [48, 49, 50], norm_lips),           # lip_left
                _normalized_sum(points, 33, [52, 53, 54], norm_lips),           # lip_right
                _distance(points[48], points[54]),                              # mouth_width
                _distance(points[51], points[57]),                              # mouth_height
            ]))

        # aggregate features across frames
        aggregated_feats = None
        if per_frame_features:
            statistics = [
                np.mean(per_frame_features, axis=0),
                np.amin(per_frame_features, axis=0),
                np.amax(per_frame_features, axis=0),
                np.std(per_frame_features, axis=0),
                np.percentile(per_frame_features, q=25, axis=0),
                np.percentile(per_frame_features, q=75, axis=0),
            ]
            aggregated_feats = np.array(statistics).reshape(1, 36)

        print("VIDEO FEAT PUB")
        return {'fl_features': aggregated_feats}

`__init__(self, domain='')` `special` ¶

Source code in adviser/services/hci/video/FeatureExtractor.py

def __init__(self, domain: Domain = ""):
    """
    Creates the contrast equalizer, the face detector and the landmark predictor.

    Args:
        domain (Domain): Forwarded to Service
    """
    Service.__init__(self, domain=domain)
    self.module_dir = os.path.dirname(os.path.abspath(__file__))
    # CLAHE (Contrast Limited Adaptive Histogram Equalization)
    self.CLAHE = cv2.createCLAHE(clipLimit=2.0, tileGridSize=(8, 8))
    # for detecting faces (returns coordinates of rectangle(s) of face area(s))
    self.DETECTOR = dlib.get_frontal_face_detector()
    # facial landmark predictor, the model file is located relative to this module
    model_path = os.path.join(self.module_dir, '..', '..', '..', 'resources', 'models', 'video', 'shape_predictor_68_face_landmarks.dat')
    predictor_file = os.path.abspath(model_path)
    self.PREDICTOR = dlib.shape_predictor(predictor_file)

`extract_fl_features(self, *args, **kwargs)` ¶

Source code in adviser/services/hci/video/FeatureExtractor.py

def delegate(self, *args, **kwargs):
    """
    Runs the wrapped function and publishes its result on the function's publish socket.

    `func`, `pub_topics` and `_send_msg` are not defined in this function; they are
    taken from the enclosing scope.

    Args:
        *args: positional arguments for the wrapped function; `self` is dropped from
               them if present, because it is passed explicitly
        **kwargs: keyword arguments, forwarded unchanged

    Returns:
        The wrapped function's result. A truthy result is re-keyed so that every key
        is reduced to the part in front of its first "/".
    """
    func_inst = getattr(self, func.__name__)

    # Drop self by identity. `self in callargs` and `callargs.remove(self)` compare
    # with ==, which raises for arguments whose == is element-wise (e.g. numpy arrays).
    callargs = [arg for arg in args if arg is not self]
    result = func(self, *callargs, **kwargs)
    if result:
        # TODO: keys with more than one "/" are split at the first "/" and everything
        # behind the second "/" is dropped
        domains = {res.split("/")[0]: res.split("/")[1] if "/" in res else "" for res in result}
        result = {key.split("/")[0]: result[key] for key in result}

    if func_inst not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[func_inst]
    service_domain = self._domain_name
    if socket and result:
        # publish messages
        # NOTE: only topics listed in pub_topics are published, not every key of result
        for topic in pub_topics:
            if topic in result:
                # Resolve the domain for this topic only. Reusing one variable across
                # iterations would let the first topic's domain leak into later topics.
                topic_domain = service_domain if service_domain else domains[topic]
                topic_domain_str = f"{topic}/{topic_domain}" if topic_domain else topic
                if topic in self._pub_topic_domains:
                    # an explicit per-topic domain overrides both other sources
                    topic_domain_str = f"{topic}/{self._pub_topic_domains[topic]}" if self._pub_topic_domains[topic] else topic
                _send_msg(socket, topic_domain_str, result[topic])
                if self.debug_logger:
                    self.debug_logger.info(
                        f"- (DS): sent message from {func} to topic {topic_domain_str}:\n   {result[topic]}")
    return result

`VideoInput` ¶

`VideoInput (Service)` ¶

Captures frames with a specified capture interval between two consecutive dialog turns and returns a list of frames.

Source code in adviser/services/hci/video/VideoInput.py

class VideoInput(Service):
    """
    Captures camera frames in a background thread and publishes each captured frame
    on the `video_input` topic, waiting at least `capture_interval` microseconds
    between two captures.
    """

    def __init__(self, domain=None, camera_id: int = 0, capture_interval: int = 10e5, identifier: str = None):
        """
        Args:
            domain: passed through to `Service.__init__`
            camera_id (int): device id (if only 1 camera device is connected, id is 0, if two are connected choose between 0 and 1, ...)
            capture_interval (int): try to capture a frame every x microseconds - is a lower bound, no hard time guarantees (e.g. 5e5 -> every >= 0.5 seconds)
            identifier (str): passed through to `Service.__init__`
        """
        Service.__init__(self, domain, identifier=identifier)

        # remembered so the device can be re-opened when a new dialog starts
        self.camera_id = camera_id
        self.cap = cv2.VideoCapture(camera_id)  # get handle to camera device
        if not self.cap.isOpened():
            # VideoCapture.open() needs the device index; calling it without arguments fails
            self.cap.open(camera_id)

        self.terminating = Event()              # a fresh Event starts out cleared
        self.capture_thread = Thread(target=self.capture)  # create thread object for capturing
        self.capture_interval = capture_interval

    def capture(self):
        """
        Continuous video capture, meant to be run in a loop.
        Calls `publish_img` once per interval tick to publish the captured image.
        Releases the camera once the loop ends.
        """
        interval_seconds = self.capture_interval * 1e-6
        while self.cap.isOpened() and not self.terminating.is_set():
            start_time = datetime.datetime.now()

            # cap.read() returns a bool (true when frame was read correctly) and the frame
            ret, frame = self.cap.read()
            if ret:
                rgb_img = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
                self.publish_img(rgb_img=rgb_img)

            # total_seconds() covers the whole elapsed time; `.microseconds` alone would
            # drop full seconds and produce a wrong wait time for slow iterations
            elapsed_seconds = (datetime.datetime.now() - start_time).total_seconds()
            wait_seconds = interval_seconds - elapsed_seconds
            if wait_seconds > 0.0:
                time.sleep(wait_seconds)

        if self.cap.isOpened():
            self.cap.release()

    def dialog_end(self):
        """Ask the capture loop to stop after its current iteration."""
        self.terminating.set()

    def dialog_start(self):
        """Start the capture thread unless it is already running.

        A `Thread` object can only be started once, so when the previous capture
        thread has already run and finished, the stop flag is cleared, the camera is
        re-opened if necessary and a new thread object is created.
        """
        if self.capture_thread.is_alive():
            return

        if self.capture_thread.ident is not None:
            # the old thread ran before and has ended (ident is only None before start())
            if not self.cap.isOpened():
                self.cap.open(self.camera_id)
            self.capture_thread = Thread(target=self.capture)

        self.terminating.clear()
        print("Starting video capture...")
        self.capture_thread.start()

    @PublishSubscribe(pub_topics=['video_input'])
    def publish_img(self, rgb_img) -> dict(video_input=List[object]):
        """
        Helper function to publish images from a loop.

        Args:
            rgb_img: the frame to publish (converted to RGB by `capture`)

        Returns:
            dict: the frame under the key `video_input`
        """
        return {'video_input': rgb_img}  # NOTE: in the future, copy frames for more safety (capturing thread may overwrite them)

`__init__(self, domain=None, camera_id=0, capture_interval=1000000.0, identifier=None)` `special` ¶

Parameters:

Name	Type	Description	Default
`camera_id`	`int`	device id (if only 1 camera device is connected, id is 0, if two are connected choose between 0 and 1, ...)	`0`
`capture_interval`	`int`	try to capture a frame every x microseconds - is a lower bound, no hard time guarantees (e.g. 5e5 -> every >= 0.5 seconds)	`1000000.0`

Source code in adviser/services/hci/video/VideoInput.py

def __init__(self, domain=None, camera_id: int = 0, capture_interval: int = 10e5, identifier: str = None):
    """
    Open the camera device and prepare (but do not start) the capture thread.

    Args:
        domain: passed through to `Service.__init__`
        camera_id (int): device id (if only 1 camera device is connected, id is 0, if two are connected choose between 0 and 1, ...)
        capture_interval (int): try to capture a frame every x microseconds - is a lower bound, no hard time guarantees (e.g. 5e5 -> every >= 0.5 seconds)
        identifier (str): passed through to `Service.__init__`
    """
    Service.__init__(self, domain, identifier=identifier)

    self.cap = cv2.VideoCapture(camera_id)  # get handle to camera device
    if not self.cap.isOpened():
        # VideoCapture.open() needs the device index; calling it without arguments fails
        self.cap.open(camera_id)

    self.terminating = Event()
    self.terminating.clear()
    self.capture_thread = Thread(target=self.capture) # create thread object for capturing
    self.capture_interval = capture_interval

`capture(self)` ¶

Continuous video capture, meant to be run in a loop. Calls publish_img once per interval tick to publish the captured image.

Source code in adviser/services/hci/video/VideoInput.py

def capture(self):
    """
    Continuous video capture, meant to be run in a loop.
    Calls `publish_img` once per interval tick to publish the captured image.
    Releases the camera once the loop ends.
    """
    interval_seconds = self.capture_interval * 1e-6
    while self.cap.isOpened() and not self.terminating.is_set():
        start_time = datetime.datetime.now()

        # cap.read() returns a bool (true when frame was read correctly) and the frame
        ret, frame = self.cap.read()
        if ret:
            rgb_img = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
            self.publish_img(rgb_img=rgb_img)

        # total_seconds() covers the whole elapsed time; `.microseconds` alone would
        # drop full seconds and produce a wrong wait time for slow iterations
        elapsed_seconds = (datetime.datetime.now() - start_time).total_seconds()
        wait_seconds = interval_seconds - elapsed_seconds
        if wait_seconds > 0.0:
            time.sleep(wait_seconds)

    if self.cap.isOpened():
        self.cap.release()

`dialog_end(self)` ¶

This function is called after a dialog ended (Topics.DIALOG_END message was received). You should overwrite this function to record dialog-level information.

Source code in adviser/services/hci/video/VideoInput.py

def dialog_end(self):
    """Raise the `terminating` flag that the capture loop checks on every iteration."""
    stop_flag = self.terminating
    stop_flag.set()

`dialog_start(self)` ¶

This function is called before the first message to a new dialog is published. You should overwrite this function to set/reset dialog-level variables.

Source code in adviser/services/hci/video/VideoInput.py

def dialog_start(self):
    """Start the capture thread, unless it is currently running."""
    worker = self.capture_thread
    if worker.is_alive():
        # capture loop is already active, nothing to do
        return
    print("Starting video capture...")
    worker.start()

`publish_img(self, *args, **kwargs)` ¶

Source code in adviser/services/hci/video/VideoInput.py

def delegate(self, *args, **kwargs):
    """Call the wrapped function and publish the values it returns.

    `func`, `pub_topics` and `_send_msg` are not defined in this block; they are
    presumably bound by the enclosing decorator / module (not visible here).

    Returns:
        The value returned by `func`. When that value is truthy it is rebuilt as a
        dict whose keys are cut off at the first "/" character.
    """
    # the bound attribute with the same name as `func` is used as key into `_publish_sockets`
    func_inst = getattr(self, func.__name__)

    callargs = list(args)
    if self in callargs:    # remove self when in *args, because already known to function
        callargs.remove(self)
    result = func(self, *callargs, **kwargs)
    if result:
        # Keys may look like "topic/domain": remember the part after the first "/" per topic
        # and strip it from the result keys.
        # fix! (user could have multiple "/" characters in topic - only use last one )
        domains = {res.split("/")[0]: res.split("/")[1] if "/" in res else "" for res in result}
        result = {key.split("/")[0]: result[key] for key in result}

    if func_inst not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[func_inst]
    domain = self._domain_name
    if socket and result:
        # publish messages
        for topic in pub_topics:
        # for topic in result: # NOTE publish any returned value in dict with it's key as topic
            if topic in result:
                # NOTE: `domain` is reassigned here, so a domain taken from one key suffix
                # is reused for all following topics of this call.
                domain = domain if domain else domains[topic]
                topic_domain_str = f"{topic}/{domain}" if domain else topic
                if topic in self._pub_topic_domains:
                    # an entry in `_pub_topic_domains` takes precedence over the domain chosen above
                    topic_domain_str = f"{topic}/{self._pub_topic_domains[topic]}" if self._pub_topic_domains[topic] else topic
                _send_msg(socket, topic_domain_str, result[topic])
                if self.debug_logger:
                    self.debug_logger.info(
                        f"- (DS): sent message from {func} to topic {topic_domain_str}:\n   {result[topic]}")
    return result

`nlg` `special` ¶

`all` `special` ¶

`affective_nlg` ¶

Handcrafted (i.e. template-based) Natural Language Generation Module

`HandcraftedEmotionNLG (HandcraftedNLG)` ¶

A child of the HandcraftedNLG, the HandcraftedEmotionNLG can choose between multiple affective response templates for each sys_act depending on the current sys_emotion

Source code in adviser/services/nlg/affective_nlg.py

class HandcraftedEmotionNLG(HandcraftedNLG):
    """
        A child of the HandcraftedNLG, the HandcraftedEmotionNLG can choose between multiple affective
        response templates for each sys_act depending on the current sys_emotion
    """
    def __init__(self, domain: Domain, sub_topic_domains={}, template_file: str = None,
                 logger: DiasysLogger = DiasysLogger(), template_file_german: str = None,
                 emotions: List[str] = [], debug_logger = None):
        """Constructor mainly extracts methods and rules from the template files

        Args:
            domain (Domain): the domain; its name selects the template files
            sub_topic_domains: passed through to `Service.__init__`
            template_file (str): stored as `template_filename`
            logger (DiasysLogger): logger used for error / info output
            template_file_german (str): not used by this constructor
            emotions (List[str]): emotions for which an additional template file is loaded
            debug_logger: passed through to `Service.__init__`
        """
        Service.__init__(self, domain=domain, sub_topic_domains=sub_topic_domains, debug_logger=debug_logger)

        self.domain = domain
        self.template_filename = template_file
        self.templates = {}
        self.logger = logger
        # copy, so the shared default list / the caller's list is never aliased by the instance
        self.emotions = list(emotions)

        self._initialise_templates()


    @PublishSubscribe(sub_topics=["sys_act", "sys_emotion", "sys_engagement"], pub_topics=["sys_utterance"])
    def generate_system_utterance(self, sys_act: SysAct = None, sys_emotion: str = None,
                                  sys_engagement: str = None) -> dict(sys_utterance=str):
        """

        Takes a system act, system emotion choice, and system engagement level choice, then
        searches for a fitting rule, applies it and returns the message.

        Args:
            sys_act (SysAct): The system act, to check whether the dialogue was finished
            sys_emotion (str): A string representing the system's choice of emotional response;
                               matched case-insensitively, the neutral templates are used when
                               no emotion is given
            sys_engagement (str): A string representing how engaged the system thinks the user is
                                  (currently not used for the template choice)

        Returns:
            dict: a dict containing the system utterance

        Raises:
            Any error raised while selecting or applying the template is logged and re-raised.
        """
        # templates are stored under lower-cased emotion names, "neutral" is always loaded
        template_key = sys_emotion.lower() if sys_emotion else "neutral"
        try:
            message = self.templates[template_key].create_message(sys_act)
        except BaseException as error:
            # BaseException on purpose: the template code raises plain BaseException instances
            self.logger.error(error)
            # inform if no applicable rule could be found in the template file
            self.logger.info('Could not find a fitting rule for the given system act!')
            if sys_act is not None:
                self.logger.info("System Action: " + str(sys_act.type)
                                 + " - Slots: " + str(sys_act.slot_values))
            raise

        # self.logger.dialog_turn("System Action: " + message)
        return {'sys_utterance': message}

    def _initialise_templates(self):
        """
            Loads one template file per configured emotion plus the neutral template file
            of the domain, then registers the "_template_" helper methods on all of them.
            The template files are looked up in '../../resources/nlg_templates/' relative
            to this module.
        """
        for emotion in self.emotions:
            self.templates[emotion.lower()] = TemplateFile(os.path.join(
                os.path.dirname(os.path.abspath(__file__)),
                f'../../resources/nlg_templates/{self.domain.get_domain_name()}Messages{emotion}.nlg'),
                self.domain)
        self.templates["neutral"] = TemplateFile(os.path.join(
            os.path.dirname(os.path.abspath(__file__)),
            f'../../resources/nlg_templates/{self.domain.get_domain_name()}Messages.nlg'),
            self.domain)

        self._add_additional_methods_for_template_file()

    def _add_additional_methods_for_template_file(self):
        """add the function prefixed by "_template_" to the template file interpreter"""
        for (method_name, method) in inspect.getmembers(type(self), inspect.isfunction):
            if method_name.startswith('_template_'):
                for emotion in self.templates:
                    # method_name[10:] drops the "_template_" prefix
                    self.templates[emotion].add_python_function(method_name[10:], method, [self])

`__init__(self, domain, sub_topic_domains={}, template_file=None, logger=<DiasysLogger adviser (NOTSET)>, template_file_german=None, emotions=[], debug_logger=None)` `special` ¶

Source code in adviser/services/nlg/affective_nlg.py

def __init__(self, domain: Domain, sub_topic_domains={}, template_file: str = None,
             logger: DiasysLogger = DiasysLogger(), template_file_german: str = None,
             emotions: List[str] = [], debug_logger = None):
    """Constructor mainly extracts methods and rules from the template files

    Args:
        domain (Domain): the domain
        sub_topic_domains: passed through to `Service.__init__`
        template_file (str): stored as `template_filename`
        logger (DiasysLogger): logger stored on the instance
        template_file_german (str): not used by this constructor
        emotions (List[str]): emotion names, stored on the instance
        debug_logger: passed through to `Service.__init__`
    """
    Service.__init__(self, domain=domain, sub_topic_domains=sub_topic_domains, debug_logger=debug_logger)

    self.domain = domain
    self.template_filename = template_file
    self.templates = {}
    self.logger = logger
    # copy, so the shared default list / the caller's list is never aliased by the instance
    self.emotions = list(emotions)

    self._initialise_templates()

`generate_system_utterance(self, *args, **kwargs)` ¶

Source code in adviser/services/nlg/affective_nlg.py

def delegate(self, *args, **kwargs):
    """Call the wrapped function and publish the values it returns.

    `func`, `pub_topics` and `_send_msg` are not defined in this block; they are
    presumably bound by the enclosing decorator / module (not visible here).

    Returns:
        The value returned by `func`. When that value is truthy it is rebuilt as a
        dict whose keys are cut off at the first "/" character.
    """
    # the bound attribute with the same name as `func` is used as key into `_publish_sockets`
    func_inst = getattr(self, func.__name__)

    callargs = list(args)
    if self in callargs:    # remove self when in *args, because already known to function
        callargs.remove(self)
    result = func(self, *callargs, **kwargs)
    if result:
        # Keys may look like "topic/domain": remember the part after the first "/" per topic
        # and strip it from the result keys.
        # fix! (user could have multiple "/" characters in topic - only use last one )
        domains = {res.split("/")[0]: res.split("/")[1] if "/" in res else "" for res in result}
        result = {key.split("/")[0]: result[key] for key in result}

    if func_inst not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[func_inst]
    domain = self._domain_name
    if socket and result:
        # publish messages
        for topic in pub_topics:
        # for topic in result: # NOTE publish any returned value in dict with it's key as topic
            if topic in result:
                # NOTE: `domain` is reassigned here, so a domain taken from one key suffix
                # is reused for all following topics of this call.
                domain = domain if domain else domains[topic]
                topic_domain_str = f"{topic}/{domain}" if domain else topic
                if topic in self._pub_topic_domains:
                    # an entry in `_pub_topic_domains` takes precedence over the domain chosen above
                    topic_domain_str = f"{topic}/{self._pub_topic_domains[topic]}" if self._pub_topic_domains[topic] else topic
                _send_msg(socket, topic_domain_str, result[topic])
                if self.debug_logger:
                    self.debug_logger.info(
                        f"- (DS): sent message from {func} to topic {topic_domain_str}:\n   {result[topic]}")
    return result

`bc_nlg` ¶

Handcrafted (i.e. template-based) Natural Language Generation Module with backchannel

`BackchannelHandcraftedNLG (HandcraftedNLG)` ¶

Handcrafted (i.e. template-based) Natural Language Generation Module

A rule-based approach on natural language generation. The rules have to be specified within a template file using the ADVISER NLG syntax. Python methods that are called within a template file must be specified in the HandcraftedNLG class by using the prefix "_template_". For example, the method "_template_genitive_s" can be accessed in the template file via calling {genitive_s(name)}

Attributes:

Name	Type	Description
`domain`	`Domain`	the domain
`template_filename`	`str`	the NLG template filename
`templates`	`TemplateFile`	the parsed and ready-to-go NLG template file
`template_english`	`str`	the name of the English NLG template file
`template_german`	`str`	the name of the German NLG template file
`language`	`Language`	the language of the dialogue

Source code in adviser/services/nlg/bc_nlg.py

class BackchannelHandcraftedNLG(HandcraftedNLG):
    """Handcrafted (i.e. template-based) Natural Language Generation Module with backchannel

    A rule-based approach on natural language generation.
    The rules have to be specified within a template file using the ADVISER NLG syntax.
    Python methods that are called within a template file must be specified in the
    HandcraftedNLG class by using the prefix "_template_". For example, the method
    "_template_genitive_s" can be accessed in the template file via calling {genitive_s(name)}

    Attributes:
        domain (Domain): the domain
        template_filename (str): the NLG template filename
        templates (TemplateFile): the parsed and ready-to-go NLG template file
        template_english (str): the name of the English NLG template file
        template_german (str): the name of the German NLG template file
        language (Language): the language of the dialogue
        backchannels (dict): maps the predicted backchannel class to its text variants
    """
    def __init__(self, domain: Domain, sub_topic_domains: Dict[str, str] = {}, template_file: str = None,
                 logger: DiasysLogger = DiasysLogger(), template_file_german: str = None,
                 language: Language = None):
        """Constructor mainly extracts methods and rules from the template file

        All arguments are forwarded to `HandcraftedNLG.__init__`.
        """
        # forward the caller's arguments instead of silently replacing them with defaults
        HandcraftedNLG.__init__(
            self, domain, template_file=template_file,
            logger=logger, template_file_german=template_file_german,
            language=language, sub_topic_domains=sub_topic_domains)

        # class_int_mapping = {0: b'no_bc', 1: b'assessment', 2: b'continuer'}
        self.backchannels = {
            0: [''],
            1: ['Okay. ', 'Yeah. '],
            2: ['Um-hum. ', 'Uh-huh. ']
        }

    @PublishSubscribe(sub_topics=["sys_act", 'predicted_BC'], pub_topics=["sys_utterance"])
    def publish_system_utterance(self, sys_act: SysAct = None, predicted_BC: int = None) -> dict(sys_utterance=str):
        """
        Takes a system act, searches for a fitting rule, adds, backchannel and applies it
        and returns the message.
        mapping = {0: b'no_bc', 1: b'assessment', 2: b'continuer'}

        Args:
            sys_act (SysAct): The system act, to check whether the dialogue was finished
            predicted_BC (int): integer representation of the BC; a missing or unknown
                                value results in no backchannel being added

        Returns:
            dict: a dict containing the system utterance
        """
        message = self.generate_system_utterance(sys_act)

        # messages containing 'Sorry' are never prefixed with a backchannel
        if 'Sorry' not in message:
            # the first variant of the predicted class is used; no prefix for unknown classes
            variants = self.backchannels.get(predicted_BC, [''])
            message = variants[0] + message

        return {'sys_utterance': message}

`__init__(self, domain, sub_topic_domains={}, template_file=None, logger=<DiasysLogger adviser (NOTSET)>, template_file_german=None, language=None)` `special` ¶

Source code in adviser/services/nlg/bc_nlg.py

def __init__(self, domain: Domain, sub_topic_domains: Dict[str, str] = {}, template_file: str = None,
             logger: DiasysLogger = DiasysLogger(), template_file_german: str = None,
             language: Language = None):
    """Constructor mainly extracts methods and rules from the template file

    All arguments are forwarded to `HandcraftedNLG.__init__`; afterwards the
    backchannel texts per predicted class are set up.
    """
    # forward the caller's arguments instead of silently replacing them with defaults
    HandcraftedNLG.__init__(
        self, domain, template_file=template_file,
        logger=logger, template_file_german=template_file_german,
        language=language, sub_topic_domains=sub_topic_domains)

    # class_int_mapping = {0: b'no_bc', 1: b'assessment', 2: b'continuer'}
    self.backchannels = {
        0: [''],
        1: ['Okay. ', 'Yeah. '],
        2: ['Um-hum. ', 'Uh-huh. ']
    }

`publish_system_utterance(self, *args, **kwargs)` ¶

Source code in adviser/services/nlg/bc_nlg.py

def delegate(self, *args, **kwargs):
    """Call the wrapped function and publish the values it returns.

    `func`, `pub_topics` and `_send_msg` are not defined in this block; they are
    presumably bound by the enclosing decorator / module (not visible here).

    Returns:
        The value returned by `func`. When that value is truthy it is rebuilt as a
        dict whose keys are cut off at the first "/" character.
    """
    # the bound attribute with the same name as `func` is used as key into `_publish_sockets`
    func_inst = getattr(self, func.__name__)

    callargs = list(args)
    if self in callargs:    # remove self when in *args, because already known to function
        callargs.remove(self)
    result = func(self, *callargs, **kwargs)
    if result:
        # Keys may look like "topic/domain": remember the part after the first "/" per topic
        # and strip it from the result keys.
        # fix! (user could have multiple "/" characters in topic - only use last one )
        domains = {res.split("/")[0]: res.split("/")[1] if "/" in res else "" for res in result}
        result = {key.split("/")[0]: result[key] for key in result}

    if func_inst not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[func_inst]
    domain = self._domain_name
    if socket and result:
        # publish messages
        for topic in pub_topics:
        # for topic in result: # NOTE publish any returned value in dict with it's key as topic
            if topic in result:
                # NOTE: `domain` is reassigned here, so a domain taken from one key suffix
                # is reused for all following topics of this call.
                domain = domain if domain else domains[topic]
                topic_domain_str = f"{topic}/{domain}" if domain else topic
                if topic in self._pub_topic_domains:
                    # an entry in `_pub_topic_domains` takes precedence over the domain chosen above
                    topic_domain_str = f"{topic}/{self._pub_topic_domains[topic]}" if self._pub_topic_domains[topic] else topic
                _send_msg(socket, topic_domain_str, result[topic])
                if self.debug_logger:
                    self.debug_logger.info(
                        f"- (DS): sent message from {func} to topic {topic_domain_str}:\n   {result[topic]}")
    return result

`nlg` ¶

Handcrafted (i.e. template-based) Natural Language Generation Module

`HandcraftedNLG (Service)` ¶

Handcrafted (i.e. template-based) Natural Language Generation Module

A rule-based approach on natural language generation. The rules have to be specified within a template file using the ADVISER NLG syntax. Python methods that are called within a template file must be specified in the HandcraftedNLG class by using the prefix "_template_". For example, the method "_template_genitive_s" can be accessed in the template file via calling {genitive_s(name)}

Attributes:

Name	Type	Description
`domain`	`Domain`	the domain
`template_filename`	`str`	the NLG template filename
`templates`	`TemplateFile`	the parsed and ready-to-go NLG template file
`template_english`	`str`	the name of the English NLG template file
`template_german`	`str`	the name of the German NLG template file
`language`	`Language`	the language of the dialogue

Source code in adviser/services/nlg/nlg.py

class HandcraftedNLG(Service):
    """Handcrafted (i.e. template-based) Natural Language Generation Module

    A rule-based approach on natural language generation.
    The rules have to be specified within a template file using the ADVISER NLG syntax.
    Python methods that are called within a template file must be specified in the
    HandcraftedNLG class by using the prefix "_template_". For example, the method
    "_template_genitive_s" can be accessed in the template file via calling {genitive_s(name)}

    Attributes:
        domain (Domain): the domain
        template_filename (str): the NLG template filename
        templates (TemplateFile): the parsed and ready-to-go NLG template file
        template_english (str): the name of the English NLG template file
        template_german (str): the name of the German NLG template file
        language (Language): the language of the dialogue
    """
    def __init__(self, domain: Domain, template_file: str = None, sub_topic_domains: Dict[str, str] = {},
                 logger: DiasysLogger = DiasysLogger(), template_file_german: str = None,
                 language: Language = None):
        """Constructor mainly extracts methods and rules from the template file

        Args:
            domain (Domain): the domain; its name selects the default template file
            template_file (str): English template file, the domain default is used when None
            sub_topic_domains (Dict[str, str]): passed through to `Service.__init__`
            logger (DiasysLogger): logger used for error / info output
            template_file_german (str): German template file, the domain default is used when None
            language (Language): language of the templates, English when None
        """
        Service.__init__(self, domain=domain, sub_topic_domains=sub_topic_domains)

        # honour the requested language; it used to be overwritten with English right after
        self.language = language if language else Language.ENGLISH
        self.template_english = template_file
        # TODO: at some point if we expand languages, maybe make kwargs? --LV
        self.template_german = template_file_german
        self.domain = domain
        self.template_filename = None
        self.templates = None
        self.logger = logger

        self._initialise_language(self.language)


    @PublishSubscribe(sub_topics=["sys_act"], pub_topics=["sys_utterance"])
    def publish_system_utterance(self, sys_act: SysAct = None) -> dict(sys_utterance=str):
        """Generates the system utterance and publishes it.

        Args:
            sys_act (SysAct): The system act published by the policy

        Returns:
            dict: a dict containing the system utterance
        """
        return {'sys_utterance': self.generate_system_utterance(sys_act)}


    def generate_system_utterance(self, sys_act: SysAct = None) -> str:
        """Main function of the NLG module

        Takes a system act, searches for a fitting rule, applies it and returns the message.
        Overwrite this function if you inherit from the NLG module.

        Args:
            sys_act (SysAct): The system act

        Returns:
            The utterance generated by applying a fitting template

        Raises:
            Any error raised while applying the template is logged and re-raised.
        """
        try:
            message = self.templates.create_message(sys_act)
        except BaseException as error:
            # BaseException on purpose: the template code raises plain BaseException instances
            self.logger.error(error)
            # inform if no applicable rule could be found in the template file
            self.logger.info('Could not find a fitting rule for the given system act!')
            if sys_act is not None:
                self.logger.info("System Action: " + str(sys_act.type)
                                 + " - Slots: " + str(sys_act.slot_values))
            raise

        # self.logger.dialog_turn("System Action: " + message)
        return message


    def _initialise_language(self, language: Language):
        """
            Loads the correct template file based on which language has been selected
            this should only be called on the first turn of the dialog

            Args:
                language (Language): Enum representing the language the user has selected
        """
        if language == Language.ENGLISH:
            if self.template_english is None:
                self.template_filename = os.path.join(
                    os.path.dirname(os.path.abspath(__file__)),
                    '../../resources/nlg_templates/%sMessages.nlg' % self.domain.get_domain_name())
            else:
                self.template_filename = self.template_english
        if language == Language.GERMAN:
            if self.template_german is None:
                self.template_filename = os.path.join(
                    os.path.dirname(os.path.abspath(__file__)),
                    '../../resources/nlg_templates/{}MessagesGerman.nlg'.format(
                        self.domain.get_domain_name()))
            else:
                self.template_filename = self.template_german

        self.templates = TemplateFile(self.template_filename, self.domain)
        self._add_additional_methods_for_template_file()

    def _add_additional_methods_for_template_file(self):
        """add the function prefixed by "_template_" to the template file interpreter"""
        for (method_name, method) in inspect.getmembers(type(self), inspect.isfunction):
            if method_name.startswith('_template_'):
                # method_name[10:] drops the "_template_" prefix
                self.templates.add_python_function(method_name[10:], method, [self])

    def _template_genitive_s(self, name: str) -> str:
        """Return the English genitive of `name` ("Chris'" / "Anna's")."""
        # endswith() also copes with an empty name, name[-1] would raise IndexError
        if name.endswith('s'):
            return f"{name}'"
        else:
            return f"{name}'s"

    def _template_genitive_s_german(self, name: str) -> str:
        """Return the German genitive of `name` ("Max'" / "Annas")."""
        # endswith() also copes with an empty name, name[-1] would raise IndexError
        if name.endswith(('s', 'x', 'ß', 'z')):
            return f"{name}'"
        else:
            return f"{name}s"

`__init__(self, domain, template_file=None, sub_topic_domains={}, logger=<DiasysLogger adviser (NOTSET)>, template_file_german=None, language=None)` `special` ¶

Constructor mainly extracts methods and rules from the template file

Source code in adviser/services/nlg/nlg.py

def __init__(self, domain: Domain, template_file: str = None, sub_topic_domains: Dict[str, str] = {},
             logger: DiasysLogger = DiasysLogger(), template_file_german: str = None,
             language: Language = None):
    """Constructor mainly extracts methods and rules from the template file

    Args:
        domain (Domain): the domain
        template_file (str): English template file, stored as `template_english`
        sub_topic_domains (Dict[str, str]): passed through to `Service.__init__`
        logger (DiasysLogger): logger stored on the instance
        template_file_german (str): German template file, stored as `template_german`
        language (Language): language of the templates, English when None
    """
    Service.__init__(self, domain=domain, sub_topic_domains=sub_topic_domains)

    # honour the requested language; it used to be overwritten with English right after
    self.language = language if language else Language.ENGLISH
    self.template_english = template_file
    # TODO: at some point if we expand languages, maybe make kwargs? --LV
    self.template_german = template_file_german
    self.domain = domain
    self.template_filename = None
    self.templates = None
    self.logger = logger

    self._initialise_language(self.language)

`generate_system_utterance(self, sys_act=None)` ¶

Main function of the NLG module

Takes a system act, searches for a fitting rule, applies it and returns the message. Overwrite this function if you inherit from the NLG module.

Parameters:

Name	Type	Description	Default
`sys_act`	`SysAct`	The system act	`None`

Returns:

Type	Description
`str`	The utterance generated by applying a fitting template

Source code in adviser/services/nlg/nlg.py

def generate_system_utterance(self, sys_act: SysAct = None) -> str:
    """Main function of the NLG module

    Takes a system act, searches for a fitting rule, applies it and returns the message.
    Overwrite this function if you inherit from the NLG module.

    Args:
        sys_act (SysAct): The system act

    Returns:
        The utterance generated by applying a fitting template

    Raises:
        Any error raised while applying the template is logged and re-raised.
    """
    try:
        message = self.templates.create_message(sys_act)
    except BaseException as error:
        # everything is re-raised below, the handler only adds log output
        self.logger.error(error)
        # inform if no applicable rule could be found in the template file
        # (this used to sit after the re-raise and could never run)
        self.logger.info('Could not find a fitting rule for the given system act!')
        if sys_act is not None:
            self.logger.info("System Action: " + str(sys_act.type)
                             + " - Slots: " + str(sys_act.slot_values))
        raise

    # self.logger.dialog_turn("System Action: " + message)
    return message

`publish_system_utterance(self, *args, **kwargs)` ¶

Source code in adviser/services/nlg/nlg.py

def delegate(self, *args, **kwargs):
    """Call the wrapped function and publish the values it returns.

    `func`, `pub_topics` and `_send_msg` are not defined in this block; they are
    presumably bound by the enclosing decorator / module (not visible here).

    Returns:
        The value returned by `func`. When that value is truthy it is rebuilt as a
        dict whose keys are cut off at the first "/" character.
    """
    # the bound attribute with the same name as `func` is used as key into `_publish_sockets`
    func_inst = getattr(self, func.__name__)

    callargs = list(args)
    if self in callargs:    # remove self when in *args, because already known to function
        callargs.remove(self)
    result = func(self, *callargs, **kwargs)
    if result:
        # Keys may look like "topic/domain": remember the part after the first "/" per topic
        # and strip it from the result keys.
        # fix! (user could have multiple "/" characters in topic - only use last one )
        domains = {res.split("/")[0]: res.split("/")[1] if "/" in res else "" for res in result}
        result = {key.split("/")[0]: result[key] for key in result}

    if func_inst not in self._publish_sockets:
        # not a publisher, just normal function
        return result

    socket = self._publish_sockets[func_inst]
    domain = self._domain_name
    if socket and result:
        # publish messages
        for topic in pub_topics:
        # for topic in result: # NOTE publish any returned value in dict with it's key as topic
            if topic in result:
                # NOTE: `domain` is reassigned here, so a domain taken from one key suffix
                # is reused for all following topics of this call.
                domain = domain if domain else domains[topic]
                topic_domain_str = f"{topic}/{domain}" if domain else topic
                if topic in self._pub_topic_domains:
                    # an entry in `_pub_topic_domains` takes precedence over the domain chosen above
                    topic_domain_str = f"{topic}/{self._pub_topic_domains[topic]}" if self._pub_topic_domains[topic] else topic
                _send_msg(socket, topic_domain_str, result[topic])
                if self.debug_logger:
                    self.debug_logger.info(
                        f"- (DS): sent message from {func} to topic {topic_domain_str}:\n   {result[topic]}")
    return result

`templates` `special` ¶

`builtinfunctions` ¶

`ForEntryFunction (Function)` ¶

Source code in adviser/services/nlg/templates/builtinfunctions.py

class ForEntryFunction(Function):
    """Built-in template function ``for_entry``.

    Calls another template function once per (slot, value) pair and joins the
    texts it produces with the given separators.
    """

    def __init__(self, global_memory):
        """Register the function signature and remember the global memory."""
        signature = 'for_entry(slots, function, separator_first, separator_last)'
        Function.__init__(self, signature)
        self.global_memory = global_memory

    def is_applicable(self, parameters: Memory) -> bool:
        """Return True when at least the four mandatory arguments were passed."""
        argument_count = len(parameters.variables)
        return argument_count >= 4

    def apply(self, parameters: Memory = None) -> str:
        """Render every (slot, value) pair with the named function and join the texts.

        Argument layout in ``parameters.variables``: 0 = iterable of pairs,
        1 = name of the function to call, 2 = separator, 3 = separator before
        the last element, 4+ = extra arguments handed to the called function.

        Raises:
            BaseException: if the called function is not applicable to a pair.
        """
        variables = parameters.variables
        callee = parameters.get_function(variables[1].value)
        extras = [entry.value for entry in variables[4:]]

        rendered: List[str] = []
        for pair in variables[0].value:
            scope = self._build_memory(pair[0], pair[1], extras)
            if callee.is_applicable(scope):
                rendered.append(callee.apply(scope))
            else:
                raise BaseException(f'The function {callee.function_name} could not be called '
                                    f'from the for_entry function')

        return self._create_text_from_elements(rendered, variables[2].value,
                                               variables[3].value)

    def _build_memory(self, slot: str, value: str, arguments: List[str]):
        """Create the memory for one call: ``slot``, ``value`` and ``arg0``, ``arg1``, ..."""
        scope = Memory(self.global_memory)
        for name, content in (('slot', slot), ('value', value)):
            scope.add_variable(Variable(name, content))
        for index, argument in enumerate(arguments):
            scope.add_variable(Variable(f'arg{index}', argument))
        return scope

    def _create_text_from_elements(self, elements: List[str], separator: str, last_separator: str):
        """Join ``elements`` with ``separator``, using ``last_separator`` before the last one."""
        if not elements:
            return ''
        if len(elements) == 1:
            return elements[0]
        pieces = [elements[0]]
        for middle in elements[1:-1]:
            pieces.append(separator + middle)
        pieces.append(last_separator + elements[-1])
        return ''.join(pieces)

`__init__(self, global_memory)` `special` ¶

Source code in adviser/services/nlg/templates/builtinfunctions.py

def __init__(self, global_memory):
    """Register the ``for_entry`` signature and remember the global memory."""
    signature = 'for_entry(slots, function, separator_first, separator_last)'
    Function.__init__(self, signature)
    self.global_memory = global_memory

`apply(self, parameters=None)` ¶

Source code in adviser/services/nlg/templates/builtinfunctions.py

def apply(self, parameters: Memory = None) -> str:
    """Render every (slot, value) pair with the named function and join the texts.

    Argument layout in ``parameters.variables``: 0 = iterable of pairs,
    1 = name of the function to call, 2 = separator, 3 = separator before the
    last element, 4+ = extra arguments handed to the called function.

    Raises:
        BaseException: if the called function is not applicable to a pair.
    """
    variables = parameters.variables
    callee = parameters.get_function(variables[1].value)
    extras = [entry.value for entry in variables[4:]]

    rendered: List[str] = []
    for pair in variables[0].value:
        scope = self._build_memory(pair[0], pair[1], extras)
        if callee.is_applicable(scope):
            rendered.append(callee.apply(scope))
        else:
            raise BaseException(f'The function {callee.function_name} could not be called '
                                f'from the for_entry function')

    return self._create_text_from_elements(rendered, variables[2].value,
                                           variables[3].value)

`is_applicable(self, parameters)` ¶

Source code in adviser/services/nlg/templates/builtinfunctions.py

def is_applicable(self, parameters: Memory) -> bool:
    """Return True when at least the four mandatory arguments were passed."""
    argument_count = len(parameters.variables)
    return argument_count >= 4

`ForEntryListFunction (Function)` ¶

Source code in adviser/services/nlg/templates/builtinfunctions.py

class ForEntryListFunction(Function):
    """Built-in template function ``for_entry_list``.

    Like ``for_entry``, but every slot comes with a list of values: the values
    of one slot are joined first, then the per-slot texts are joined.
    """

    def __init__(self, global_memory: GlobalMemory):
        """Register the function signature and remember the global memory."""
        signature = ('for_entry_list(slots, function, value_sep, value_sep_last, '
                     'slot_sep, slot_sep_last)')
        Function.__init__(self, signature)
        self.global_memory = global_memory

    def is_applicable(self, parameters: Memory) -> bool:
        """Return True when at least the six mandatory arguments were passed."""
        argument_count = len(parameters.variables)
        return argument_count >= 6

    def apply(self, parameters: Memory = None) -> str:
        """Render all values of all slots with the named function and join the texts.

        Argument layout in ``parameters.variables``: 0 = iterable of
        (slot, values) pairs, 1 = name of the function to call, 2/3 = separators
        between the values of one slot, 4/5 = separators between slots,
        6+ = extra arguments handed to the called function.

        Raises:
            BaseException: if the called function is not applicable to a value.
        """
        variables = parameters.variables
        callee = parameters.get_function(variables[1].value)
        extras = [entry.value for entry in variables[6:]]

        rendered_slots: List[str] = []
        for pair in variables[0].value:
            rendered_values: List[str] = []
            for value in pair[1]:
                scope = self._build_memory(pair[0], value, extras)
                if callee.is_applicable(scope):
                    rendered_values.append(callee.apply(scope))
                else:
                    raise BaseException(f'The function {callee.function_name} could not be '
                                        f'called from the for_entry_list function')
            # inner join: the values belonging to one slot
            rendered_slots.append(
                self._create_text_from_elements(rendered_values, variables[2].value,
                                                variables[3].value))

        # outer join: the texts of all slots
        return self._create_text_from_elements(rendered_slots, variables[4].value,
                                               variables[5].value)

    def _build_memory(self, slot: str, value: str, arguments: List[str]):
        """Create the memory for one call: ``slot``, ``value`` and ``arg0``, ``arg1``, ..."""
        scope = Memory(self.global_memory)
        for name, content in (('slot', slot), ('value', value)):
            scope.add_variable(Variable(name, content))
        for index, argument in enumerate(arguments):
            scope.add_variable(Variable(f'arg{index}', argument))
        return scope

    def _create_text_from_elements(self, elements: List[str], separator: str, last_separator: str):
        """Join ``elements`` with ``separator``, using ``last_separator`` before the last one."""
        if not elements:
            return ''
        if len(elements) == 1:
            return elements[0]
        pieces = [elements[0]]
        for middle in elements[1:-1]:
            pieces.append(separator + middle)
        pieces.append(last_separator + elements[-1])
        return ''.join(pieces)

`__init__(self, global_memory)` `special` ¶

Source code in adviser/services/nlg/templates/builtinfunctions.py

def __init__(self, global_memory: GlobalMemory):
    """Register the ``for_entry_list`` signature and remember the global memory."""
    signature = ('for_entry_list(slots, function, value_sep, value_sep_last, '
                 'slot_sep, slot_sep_last)')
    Function.__init__(self, signature)
    self.global_memory = global_memory

`apply(self, parameters=None)` ¶

Source code in adviser/services/nlg/templates/builtinfunctions.py

def apply(self, parameters: Memory = None) -> str:
    """Render all values of all slots with the named function and join the texts.

    Argument layout in ``parameters.variables``: 0 = iterable of (slot, values)
    pairs, 1 = name of the function to call, 2/3 = separators between the
    values of one slot, 4/5 = separators between slots, 6+ = extra arguments
    handed to the called function.

    Raises:
        BaseException: if the called function is not applicable to a value.
    """
    variables = parameters.variables
    callee = parameters.get_function(variables[1].value)
    extras = [entry.value for entry in variables[6:]]

    rendered_slots: List[str] = []
    for pair in variables[0].value:
        rendered_values: List[str] = []
        for value in pair[1]:
            scope = self._build_memory(pair[0], value, extras)
            if callee.is_applicable(scope):
                rendered_values.append(callee.apply(scope))
            else:
                raise BaseException(f'The function {callee.function_name} could not be '
                                    f'called from the for_entry_list function')
        # inner join: the values belonging to one slot
        rendered_slots.append(
            self._create_text_from_elements(rendered_values, variables[2].value,
                                            variables[3].value))

    # outer join: the texts of all slots
    return self._create_text_from_elements(rendered_slots, variables[4].value,
                                           variables[5].value)

`is_applicable(self, parameters)` ¶

Source code in adviser/services/nlg/templates/builtinfunctions.py

def is_applicable(self, parameters: Memory) -> bool:
    """Return True when at least the six mandatory arguments were passed."""
    argument_count = len(parameters.variables)
    return argument_count >= 6

`ForFunction (Function)` ¶

Source code in adviser/services/nlg/templates/builtinfunctions.py

class ForFunction(Function):
    """Built-in template function ``for``.

    Calls another template function once per value and joins the texts it
    produces with the given separators.
    """

    def __init__(self, global_memory):
        """Register the function signature and remember the global memory."""
        signature = 'for(values, function, separator_first, separator_last, *args)'
        Function.__init__(self, signature)
        self.global_memory = global_memory

    def is_applicable(self, parameters: Memory) -> bool:
        """Return True when at least the four mandatory arguments were passed."""
        argument_count = len(parameters.variables)
        return argument_count >= 4

    def apply(self, parameters: Memory = None) -> str:
        """Render every value with the named function and join the resulting texts.

        Argument layout in ``parameters.variables``: 0 = iterable of values,
        1 = name of the function to call, 2 = separator, 3 = separator before
        the last element, 4+ = extra arguments handed to the called function.

        Raises:
            BaseException: if the called function is not applicable to a value.
        """
        variables = parameters.variables
        callee = parameters.get_function(variables[1].value)
        extras = [entry.value for entry in variables[4:]]

        rendered: List[str] = []
        for value in variables[0].value:
            scope = self._build_memory(value, extras)
            if callee.is_applicable(scope):
                rendered.append(callee.apply(scope))
            else:
                raise BaseException(f'The function {callee.function_name} could not be called '
                                    f'from the for function')

        return self._create_text_from_elements(rendered, variables[2].value,
                                               variables[3].value)

    def _build_memory(self, value: str, arguments: List[str]):
        """Create the memory for one call: ``value`` and ``arg0``, ``arg1``, ..."""
        scope = Memory(self.global_memory)
        scope.add_variable(Variable('value', value))
        for index, argument in enumerate(arguments):
            scope.add_variable(Variable(f'arg{index}', argument))
        return scope

    def _create_text_from_elements(self, elements: List[str], separator: str, last_separator: str):
        """Join ``elements`` with ``separator``, using ``last_separator`` before the last one."""
        if not elements:
            return ''
        if len(elements) == 1:
            return elements[0]
        pieces = [elements[0]]
        for middle in elements[1:-1]:
            pieces.append(separator + middle)
        pieces.append(last_separator + elements[-1])
        return ''.join(pieces)

`__init__(self, global_memory)` `special` ¶

Source code in adviser/services/nlg/templates/builtinfunctions.py

def __init__(self, global_memory):
    """Register the ``for`` signature and remember the global memory."""
    signature = 'for(values, function, separator_first, separator_last, *args)'
    Function.__init__(self, signature)
    self.global_memory = global_memory

`apply(self, parameters=None)` ¶

Source code in adviser/services/nlg/templates/builtinfunctions.py

def apply(self, parameters: Memory = None) -> str:
    """Render every value with the named function and join the resulting texts.

    Argument layout in ``parameters.variables``: 0 = iterable of values,
    1 = name of the function to call, 2 = separator, 3 = separator before the
    last element, 4+ = extra arguments handed to the called function.

    Raises:
        BaseException: if the called function is not applicable to a value.
    """
    variables = parameters.variables
    callee = parameters.get_function(variables[1].value)
    extras = [entry.value for entry in variables[4:]]

    rendered: List[str] = []
    for value in variables[0].value:
        scope = self._build_memory(value, extras)
        if callee.is_applicable(scope):
            rendered.append(callee.apply(scope))
        else:
            raise BaseException(f'The function {callee.function_name} could not be called '
                                f'from the for function')

    return self._create_text_from_elements(rendered, variables[2].value,
                                           variables[3].value)

`is_applicable(self, parameters)` ¶

Source code in adviser/services/nlg/templates/builtinfunctions.py

def is_applicable(self, parameters: Memory) -> bool:
    """Return True when at least the four mandatory arguments were passed."""
    argument_count = len(parameters.variables)
    return argument_count >= 4

`PythonFunction (Function)` ¶

Source code in adviser/services/nlg/templates/builtinfunctions.py

class PythonFunction(Function):
    """Template function that forwards its arguments to a plain Python callable."""

    def __init__(self, function_name: str, function_to_call: Callable,
                 obligatory_arguments: List[object] = None):
        """
        Args:
            function_name: name of the function; handed to ``Function.__init__``
                as ``'<function_name>()'``.
            function_to_call: callable invoked by :meth:`apply`.
            obligatory_arguments: values that are always passed to the callable,
                in front of the template arguments. Defaults to no arguments.
        """
        Function.__init__(self, f'{function_name}()')
        self.function = function_to_call
        # A literal [] default would be one list object shared by every instance
        # created without this argument, so a fresh list is created here instead.
        self.obligatory_arguments = [] if obligatory_arguments is None else obligatory_arguments

    def is_applicable(self, parameters: Memory) -> bool:
        """Always applicable: the arguments are not checked before the call."""
        return True

    def apply(self, parameters: Memory = None) -> str:
        """Call the wrapped callable and return its result.

        Args:
            parameters: memory whose variable values are appended, in order, to
                the obligatory arguments. ``None`` (the declared default) means
                that only the obligatory arguments are passed.

        Returns:
            Whatever the wrapped callable returns.
        """
        # parameters defaults to None, so it must not be dereferenced blindly
        template_values = [] if parameters is None else \
            [variable.value for variable in parameters.variables]
        # unpacking builds a new argument sequence; self.obligatory_arguments stays untouched
        return self.function(*self.obligatory_arguments, *template_values)

`__init__(self, function_name, function_to_call, obligatory_arguments=[])` `special` ¶

Source code in adviser/services/nlg/templates/builtinfunctions.py

def __init__(self, function_name: str, function_to_call: Callable,
             obligatory_arguments: List[object] = None):
    """
    Args:
        function_name: name of the function; handed to ``Function.__init__``
            as ``'<function_name>()'``.
        function_to_call: callable stored as ``self.function``.
        obligatory_arguments: values stored as ``self.obligatory_arguments``.
            Defaults to no arguments.
    """
    Function.__init__(self, f'{function_name}()')
    self.function = function_to_call
    # A literal [] default would be one list object shared by every instance
    # created without this argument, so a fresh list is created here instead.
    self.obligatory_arguments = [] if obligatory_arguments is None else obligatory_arguments

`apply(self, parameters=None)` ¶

Source code in adviser/services/nlg/templates/builtinfunctions.py

def apply(self, parameters: Memory = None) -> str:
    """Call the wrapped callable and return its result.

    Args:
        parameters: memory whose variable values are appended, in order, to
            ``self.obligatory_arguments``. ``None`` (the declared default) means
            that only the obligatory arguments are passed.

    Returns:
        Whatever ``self.function`` returns.
    """
    # parameters defaults to None, so it must not be dereferenced blindly
    template_values = [] if parameters is None else \
        [variable.value for variable in parameters.variables]
    # unpacking builds a new argument sequence; self.obligatory_arguments stays untouched
    return self.function(*self.obligatory_arguments, *template_values)

`is_applicable(self, parameters)` ¶

Source code in adviser/services/nlg/templates/builtinfunctions.py

def is_applicable(self, parameters: Memory) -> bool:
    """Always applicable: the arguments are not checked before the call."""
    applicable = True
    return applicable

`parsing` `special` ¶

`automaton` ¶

`ModifiedPushdownAutomaton` ¶

Source code in adviser/services/nlg/templates/parsing/automaton.py

class ModifiedPushdownAutomaton:
    """Automaton with an attached stack that consumes an input tape char by char.

    Transitions are looked up per (state, character); a state's default
    transition is used when no specific transition matches.
    """

    def __init__(self, start_state: State, accept_states: List[State],
                 state_descriptions: List[StateDescription]):
        """Store the automaton definition and derive the transition lookup tables."""
        self.start_state = start_state
        self.accept_states = accept_states
        self.state_descriptions = state_descriptions

        # both tables are built from self.state_descriptions, which must be set first
        self.state_transition_mapping = self._create_state_transition_mapping()
        self.state_default_transition_mapping = self._create_state_default_transition_mapping()

        self.stack = AutomatonStack()

    def _create_state_transition_mapping(self) -> Dict[State, Dict[str, Transition]]:
        """Build the table state -> input character -> transition."""
        mapping = {}
        for description in self.state_descriptions:
            per_character = mapping.setdefault(description.default_state, {})
            for transition in description.transitions:
                per_character[transition.input_configuration.character] = transition
        return mapping

    def _create_state_default_transition_mapping(self) -> Dict[State, DefaultTransition]:
        """Build the table state -> default transition."""
        return {
            description.default_state: description.default_transition
            for description in self.state_descriptions
        }

    def parse(self, input_tape: str) -> List[object]:
        """Run the automaton over ``input_tape`` and return a copy of the data stack.

        Raises:
            ParsingError: if a step fails (state, index and input are printed
                before re-raising) or if the automaton does not end in one of
                the accept states.
        """
        self.stack.clear()
        state = self.start_state

        for position, symbol in enumerate(input_tape):
            try:
                current = Configuration(state, symbol)
                state = self._apply_transition(self._find_transition(current), current)
            except ParsingError as parsing_error:
                print('State:', state.name)
                print('Index:', position)
                print('Original Input:', input_tape)
                raise parsing_error

        if state in self.accept_states:
            return self.stack.data_stack[:]

        print('State:', state.name)
        raise ParsingError('Parser was not in a final state after the input tape was read.')

    def _apply_transition(self, transition: Transition,
                          input_configuration: Configuration) -> State:
        """Perform the transition's stack action, record its output char, return the next state."""
        transition.perform_stack_action(self.stack, input_configuration)
        result = transition.get_output_configuration(input_configuration)
        self.stack.add_char(result.character)
        return result.state

    def _find_transition(self, configuration: Configuration):
        """Return the specific transition for the configuration, else the state's default."""
        candidates = self.state_transition_mapping.get(configuration.state)
        if candidates is not None and configuration.character in candidates:
            return candidates[configuration.character]
        return self._find_default_transition(configuration.state)

    def _find_default_transition(self, current_state: State):
        """Return the default transition of ``current_state``.

        Raises:
            ParsingError: if the state has no entry in the default-transition table.
        """
        defaults = self.state_default_transition_mapping
        if current_state in defaults:
            return defaults[current_state]
        raise ParsingError(f'No default transition found for state {current_state.name}.')

`__init__(self, start_state, accept_states, state_descriptions)` `special` ¶

Source code in adviser/services/nlg/templates/parsing/automaton.py

def __init__(self, start_state: State, accept_states: List[State],
             state_descriptions: List[StateDescription]):
    """Store the automaton definition and derive the transition lookup tables.

    Args:
        start_state: state in which ``parse`` starts.
        accept_states: states in which ``parse`` may end without raising.
        state_descriptions: descriptions from which the transition tables are built.
    """
    self.start_state = start_state
    self.accept_states = accept_states
    self.state_descriptions = state_descriptions

    # both tables are built from self.state_descriptions, so it has to be set first
    self.state_transition_mapping = self._create_state_transition_mapping()
    self.state_default_transition_mapping = self._create_state_default_transition_mapping()

    # stack that is cleared and read by parse
    self.stack = AutomatonStack()

`parse(self, input_tape)` ¶

Source code in adviser/services/nlg/templates/parsing/automaton.py

def parse(self, input_tape: str) -> List[object]:
    """Run the automaton over ``input_tape`` and return a copy of the data stack.

    Raises:
        ParsingError: if a step fails (state, index and input are printed before
            re-raising) or if the automaton does not end in one of the accept
            states.
    """
    self.stack.clear()
    state = self.start_state

    for position, symbol in enumerate(input_tape):
        try:
            current = Configuration(state, symbol)
            state = self._apply_transition(self._find_transition(current), current)
        except ParsingError as parsing_error:
            print('State:', state.name)
            print('Index:', position)
            print('Original Input:', input_tape)
            raise parsing_error

    if state in self.accept_states:
        return self.stack.data_stack[:]

    print('State:', state.name)
    raise ParsingError('Parser was not in a final state after the input tape was read.')