Merge pull request #24 from emrgnt-cmplxty/feature/add-hugging-face-rebased2

Feature/add hugging face rebased2
emrgnt-cmplxty · Aug 25, 2023 · 3861cf1 · 3861cf1
2 parents 200bfd8 + 659b980
commit 3861cf1
Show file tree

Hide file tree

Showing 9 changed files with 704 additions and 15 deletions.
diff --git a/README.md b/README.md
@@ -2,7 +2,7 @@
 
 ## Overview
 
-The Zero-Shot Replication Framework is a minimal environment designed to replicate zero-shot results from past academic papers. It currently supports OpenAI models to generate completions for various datasets and provides tools for handling, evaluating, and storing these completions.
+The Zero-Shot Replication Framework is a minimal environment designed to replicate zero-shot results from past academic papers. It currently supports OpenAI, Anthropic, and HuggingFace models to generate completions for various datasets and provides tools for handling, evaluating, and storing these completions.
 
 ## Features
 
@@ -71,15 +71,15 @@ To see explicit commands ran to generate the reported results, check out the [co
 
 ## Results (all models accessed on 08/24)
 
-| Category | gpt-3.5-turbo-0301 | gpt-3.5-turbo-0613 | Claude 2 | GPT-4-0314 | GPT-4-0613 | GPT-4 Baseline | Sources |
-|------------------|--------------------|--------------------|----------|------------|------------|----------------|----------|
-| HumanEval | 81.7 | XX  | 65.2 | 87.2 | 84.1 | 67 | [1] |
-| EvalPlus | 71.3 | XX  | 54.9 | 79.2 | 74.4 | N/A | |
-| Leetcode Easy | XX | XX | XX  | 91.0 | 88.0 | 72.2-75.6 | [1,2] |
-| Leetcode Medium | XX | XX | XX  | 26.0 | 17.0 | 26.2-38.7 | [1,2] |
-| Leetcode Hard | XX | XX | XX  | 6.0 | 4.0 | 6.7-7 | [1,2] |
-| GSM8K | XX | XX | XX | X | X | 87.1 | |
-| MATH | XX | XX | XX | 49.0 | 46.4 | 42.2 | [3] |
+| Category  | gpt-3.5-turbo-0301 | gpt-3.5-turbo-0613 | claude-2 | gpt-4-0314 | gpt-4-0613 | gpt-4 Baseline | Sources |
+|----------------------|--------------------|--------------------|----------|------------|------------|----------------|----------|
+| HumanEval  | 81.7 | 61.5 | 65.2 | 87.2 | 84.1 | 67 | [1] |
+| EvalPlus  | 71.3 | 54.2 | 54.9 | 79.2 | 74.4 | N/A | |
+| LeetCode_100 Easy | XX | XX | 73.0 | 91.0 | 88.0 | 72.2-75.6 | [1,2] |
+| LeetCode_100 Medium | XX | XX | 16.0 | 26.0 | 17.0 | 26.2-38.7 | [1,2] |
+| LeetCode_100 Hard | XX | XX | 2.0 | 6.0 | 4.0 | 6.7-7 | [1,2] |
+| GSM8K  | XX | XX | XX | X | X | 87.1 | |
+| MATH  | XX | XX | XX | 49.0 | 46.4 | 42.2 | [3] |
 
 ## License
 

diff --git a/poetry.lock b/poetry.lock
diff --git a/pyproject.toml b/pyproject.toml
@@ -22,6 +22,9 @@ python-leetcode = "1.2.1"
 astunparse = "1.6.3"
 anthropic = "^0.3.10"
 numpy = "^1.25.2"
+transformers = "^4.32.0"
+torch = "^2.0.1"
+accelerate = "^0.22.0"
 
 [tool.poetry.group.dev.dependencies]
 sourcery = "^1.6.0"

diff --git a/...thropic/leetcode/claude_2/anthropic_leetcode__model_eq_claude_2__temperature_eq_0p7.jsonl b/...thropic/leetcode/claude_2/anthropic_leetcode__model_eq_claude_2__temperature_eq_0p7.jsonl
diff --git a/zero_shot_replication/helpers/utils.py b/zero_shot_replication/helpers/utils.py
@@ -100,7 +100,7 @@ def parse_arguments() -> argparse.Namespace:
 def prep_for_file_path(in_path: str) -> str:
  """Prepare a string to be used in a file path."""
 
- return in_path.replace("-", "_").replace(".", "p")
+ return in_path.replace("-", "_").replace(".", "p").replace("/", "_")
 
 
 def extract_code(raw_response: str) -> str:

diff --git a/zero_shot_replication/llm_providers/base.py b/zero_shot_replication/llm_providers/base.py
@@ -4,13 +4,21 @@
 
 
 class LLMProvider(ABC):
+ """An abstract class to provide a common interface for LLM providers."""
+
+ @abstractmethod
+ def __init__(self, model: str, temperature: float) -> None:
+ pass
+
  @abstractmethod
  def get_completion(self, prompt: str) -> str:
  pass
 
 
 @dataclass
 class ProviderConfig:
+ """A dataclass to hold the configuration for a provider."""
+
  name: str
  models: List[str]
  llm_class: Type[LLMProvider]
diff --git a/zero_shot_replication/llm_providers/huggingface.py b/zero_shot_replication/llm_providers/huggingface.py
@@ -0,0 +1,48 @@
+import torch
+import transformers
+from transformers import AutoTokenizer
+
+from zero_shot_replication.llm_providers.base import LLMProvider
+
+
+class HuggingFaceZeroShotProvider(LLMProvider):
+ """A class to provide zero-shot completions from HuggingFace models."""
+
+ MAX_TOKENS_TO_SAMPLE = (
+ 4_096 # This is a large value, we should check if it makes sense
+ )
+
+ def __init__(
+ self,
+ model: str = "facebook/opt-125m",
+ temperature: float = 0.7,
+ stream: bool = False,
+ ) -> None:
+ self.model = model
+ self.temperature = temperature
+ self.stream = stream
+ self.tokenizer = AutoTokenizer.from_pretrained(self.model)
+
+ self.pipeline = transformers.pipeline(
+ "text-generation",
+ model=self.model,
+ torch_dtype=torch.float16,
+ device_map="auto",
+ )
+
+ def get_completion(self, prompt: str) -> str:
+ """Get a completion from the HuggingFace pipeline (stub: ignores the prompt, prints a fixed sample generation, then raises NotImplementedError)."""
+
+ sequences = self.pipeline(
+ 'I liked "Breaking Bad" and "Band of Brothers". Do you have any recommendations of other shows I might like?\n',
+ do_sample=True,
+ top_k=10,
+ num_return_sequences=1,
+ eos_token_id=self.tokenizer.eos_token_id,
+ max_length=HuggingFaceZeroShotProvider.MAX_TOKENS_TO_SAMPLE,
+ )
+ for seq in sequences:
+ print(f"Result: {seq['generated_text']}")
+ raise NotImplementedError(
+ "HuggingFaceZeroShotProvider not implemented."
+ )
diff --git a/zero_shot_replication/llm_providers/provider_manager.py b/zero_shot_replication/llm_providers/provider_manager.py
@@ -5,6 +5,9 @@
  LLMProvider,
  ProviderConfig,
 )
+from zero_shot_replication.llm_providers.huggingface import (
+ HuggingFaceZeroShotProvider,
+)
 from zero_shot_replication.llm_providers.openai import OpenAIZeroShotProvider
 
 
@@ -25,14 +28,28 @@ class ProviderManager:
  ["claude-2", "claude-instant-1"],
  AnthropicZeroShotProvider,
  ),
+ ProviderConfig(
+ "huggingface",
+ [
+ "facebook/opt-125m", # for testing
+ "meta-llama/Llama-2-7b",
+ "meta-llama/Llama-2-13b",
+ "meta-llama/Llama-2-70b",
+ ],
+ HuggingFaceZeroShotProvider,
+ ),
  ]
 
  @staticmethod
- def get_provider(provider_name: str, model_name: str) -> LLMProvider:
+ def get_provider(
+ provider_name: str, model_name: str, temperature: float
+ ) -> LLMProvider:
  for provider in ProviderManager.PROVIDERS:
  if provider.name == provider_name:
  if model_name in provider.models:
- return provider.llm_class()
+ return provider.llm_class(
+ model=model_name, temperature=temperature
+ )
  raise ValueError(
  f"Model '{model_name}' not supported by provider '{provider_name}'"
  )

diff --git a/zero_shot_replication/runner.py b/zero_shot_replication/runner.py
@@ -53,7 +53,9 @@ def get_output_path(args: argparse.Namespace) -> str:
  out_path = get_output_path(args)
 
  # Build an LLM provider instance
- llm_provider = ProviderManager.get_provider(args.provider, args.model)
+ llm_provider = ProviderManager.get_provider(
+ args.provider, args.model, args.temperature
+ )
 
  if not llm_provider:
  raise NotImplementedError(f"Provider '{args.provider}' not supported.")