"""
This module integrates the RWKV library by providing convenience utilities.
"""
   11__all__ = [
"create_engine_vocabulary", 
"PIPELINE", 
"PIPELINE_ARGS"]
 
   14    A wrapper for the arguments of the pipeline of RWKV. 
   27                 engine_gen_config=EngineGenerationConfig()):
 
   28        super().
__init__(temperature, top_p, top_k, alpha_frequency, alpha_presence, alpha_decay, token_ban, token_stop,
 
 
 
   35    Create a vocabulary for the KBNF engine. 
   37    assert WORD_NAME == 
'rwkv_vocab_v20230424', 
"Only world vocabulary is supported!" 
   38    return kbnf.Vocabulary({k: Token(v) 
for k, v 
in tokenizer.idx2token.items()},
 
   39                           {k: v.decode(
"UTF-8", errors=
"replace") 
for k, v 
in 
   40                            tokenizer.idx2token.items()})
 
 
   45    A wrapper for the pipeline of RWKV. 
   48    def __init__(self, model, WORD_NAME, formatter_builder: FormatterBuilder = 
None):  
 
   51        formatter = formatter_builder.build(vocabulary, 
lambda tokens: self.tokenizer.decode(tokens))
 
   52        if formatter 
is not None:
 
   57    def generate(self, ctx, token_count=100, args=PIPELINE_ARGS(), callback=
None, state=
None):
 
 
   62        if args.engine_gen_config.reset_at_beginning 
and self.
formatter and self.
formatter.is_completed():
 
   64        for i 
in range(token_count):
 
   66            tokens = self.encode(ctx) 
if i == 0 
else [token]
 
   68                if i == 0 
and args.engine_gen_config.read_prompt:
 
   71            while len(tokens) > 0:
 
   72                out, state = self.model.forward(tokens[:args.chunk_len], state)
 
   73                tokens = tokens[args.chunk_len:]
 
   76            for n 
in args.token_ban:
 
   77                out[n] = -float(
'inf')
 
   79                out[n] -= (args.alpha_presence + occurrence[n] * args.alpha_frequency)
 
   82                formatter.compute_allowed_tokens()
 
   83                out = out[:len(self.tokenizer.idx2token) + 1]  
 
   84                out = formatter.mask_logits(out)
 
   86            token = self.sample_logits(out, temperature=args.temperature, top_p=args.top_p, top_k=args.top_k)
 
   89            if token 
in args.token_stop:
 
   92            for xxx 
in occurrence:
 
   93                occurrence[xxx] *= args.alpha_decay
 
   95            ttt = self.decode([token])
 
   97            if ttt 
in ' \t0123456789':
 
   99            if token 
not in occurrence:
 
  100                occurrence[token] = www
 
  102                occurrence[token] += www
 
  106            tmp = self.decode(all_tokens[out_last:])
 
  107            if '\ufffd' not in tmp: