TheBloke
/

h2ogpt-gm-oasst1-en-2048-falcon-7b-v3-GPTQ

Text Generation

RefinedWebModel

large language model

text-generation-inference

4-bit precision

Model card Files Files and versions Community

TheBloke committed on Jul 15, 2023

Commit

9276de5

•

1 Parent(s): 24c59b6

Initial GPTQ model commit

Files changed (1) hide show

h2oai_pipeline.py +42 -0

h2oai_pipeline.py ADDED Viewed

	@@ -0,0 +1,42 @@

+from transformers import TextGenerationPipeline
+from transformers.pipelines.text_generation import ReturnType
+# Prompt template: the user's text is substituted for ``{instruction}`` and the
+# string ends with the ``<|answer|>`` marker that precedes the model's reply.
+STYLE = "<|prompt|>{instruction}<|endoftext|><|answer|>"
+class H2OTextGenerationPipeline(TextGenerationPipeline):
+    def __init__(self, *args, **kwargs):
+        super().__init__(*args, **kwargs)
+        self.prompt = STYLE
+    def preprocess(
+        self, prompt_text, prefix="", handle_long_generation=None, **generate_kwargs
+    ):
+        prompt_text = self.prompt.format(instruction=prompt_text)
+        return super().preprocess(
+            prompt_text,
+            prefix=prefix,
+            handle_long_generation=handle_long_generation,
+            **generate_kwargs,
+        )
+    def postprocess(
+        self,
+        model_outputs,
+        return_type=ReturnType.FULL_TEXT,
+        clean_up_tokenization_spaces=True,
+    ):
+        records = super().postprocess(
+            model_outputs,
+            return_type=return_type,
+            clean_up_tokenization_spaces=clean_up_tokenization_spaces,
+        )
+        for rec in records:
+            rec["generated_text"] = (
+                rec["generated_text"]
+                .split("<|answer|>")[1]
+                .strip()
+                .split("<|prompt|>")[0]
+                .strip()
+            )
+        return records