Update README.md
README.md CHANGED

@@ -85,4 +85,56 @@ def gen(old, new, max_new_tokens=200, temperature=0.45, top_p=0.90):
    return [tokenizer.decode(out[len(toks[0]):], skip_special_tokens=True) for out in outs]
```

Use the `gen` function with the old and new versions of the code; a sketch of the call itself appears after the example.

# Example:
```py
- import datasets
- from pathlib import Path
from code_editing.models import CodeLlamaEditModel, LlamaChatModel, EditModel, EditCommand, ChatAdaptorEditModel, OctoCoderChatModel, codellama_edit_prompt_diff, apply_rel_diff_trim, OpenAIChatModel, StarCoderCommitEditModel
from code_editing.humanevalpack import batch_prompts_from_example
from code_editing.utils import gunzip_json_write
from typing import List, Callable
from tqdm import tqdm


# NOTE: this is the factory for each model type. to add a new model type, add a new case here
# and implement it in models.py. Also, add a new case in the argument parser below.
- def model_factory(model_type: str, quantize=False, num_gpus=1) -> Callable[[str], EditModel]:
+ def model_factory(
+     model_type: str,
+     quantize=False,
+     num_gpus=1,
+     system_supported=True,
+ ) -> Callable[[str], EditModel]:
    if model_type == "codellama" or model_type == "deepseek":
        return CodeLlamaEditModel
    elif model_type == "starcoder":
        return StarCoderCommitEditModel
    elif model_type == "codellama-diff":
        return (lambda path: CodeLlamaEditModel(path, prompt_format=codellama_edit_prompt_diff, post_process=apply_rel_diff_trim))
    elif model_type == "openai":
        return (lambda path: ChatAdaptorEditModel(OpenAIChatModel(path)))
    elif model_type == "codellama-chat":
-        return (lambda path: ChatAdaptorEditModel(LlamaChatModel(path, quantization=quantize, num_gpus=num_gpus)))
+        return (lambda path: ChatAdaptorEditModel(LlamaChatModel(path, quantization=quantize, num_gpus=num_gpus, system_supported=system_supported)))
    elif model_type == "octocoder":
        return (lambda path: ChatAdaptorEditModel(OctoCoderChatModel(path, quantization=quantize, num_gpus=num_gpus)))
    else:
        raise ValueError(f"Unknown model type: {model_type}")

def complete_problem(example: EditCommand, model: EditModel, batch_size: int, completion_limit: int, **kwargs) -> List[str]:
    batches = batch_prompts_from_example(example, batch_size, completion_limit)

    completions = []
    for batch in batches:
        resps = model.generate(batch, **kwargs)
        for resp in resps:
            completions.append(resp["content"])

    return completions
```
Produced:
```
Add system_supported argument to model_factory
```
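The call itself is not shown above, so here is a minimal, hypothetical sketch of how `gen` might be invoked on the old and new code. The file names and the way the two versions are read are assumptions for illustration only; the parts taken from the snippet above are `gen`'s signature and the fact that it returns a list of decoded strings.

```py
# Hypothetical sketch: read the two versions of the edited file as plain strings.
# The file names below are placeholders, not part of the repository.
with open("models_before.py") as f:
    old = f.read()
with open("models_after.py") as f:
    new = f.read()

# `gen` (defined above) returns a list of decoded generations; each entry is a
# candidate commit message for the old -> new change.
for message in gen(old, new, max_new_tokens=200, temperature=0.45, top_p=0.90):
    print(message)
```

For the old/new pair shown in the example, one sampled output is the message listed under `Produced:`.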