Megatronlm client (#89)

* Adjusted .gitignore
* Added client implementation for megatronlm
* Minor correction
* Make commit hooks happy
* Use Megatron-LM server metadata
* Added batching for tokenization
* Adapted greedy until generation method
* Fix is_max_logprobs issue
* Adapted context handling for megatronlm client -> Fix high PPL for SP BPE tokenizer
* Megatron-LM client: Corrected unnatural tokenization warning
* Changed preparation of continuation.
* Added parameter for setting bootstrap iterations

---------

Co-authored-by: KlaudiaTH <[email protected]>
Co-authored-by: janEbert <[email protected]>
OpenGPTX · Sep 1, 2023 · 93e3595 · 93e3595
1 parent 993faed
commit 93e3595
Show file tree

Hide file tree

Showing 4 changed files with 436 additions and 0 deletions.
diff --git a/.gitignore b/.gitignore
@@ -1,7 +1,12 @@
 env
 *.pyc
+*.log
 data/
 lm_cache
 .idea
+.vscode
+
+*.egg-info
+
 
 tests/test_cache.db
diff --git a/lm_eval/models/__init__.py b/lm_eval/models/__init__.py
@@ -2,6 +2,7 @@
 from . import gpt3
 from . import anthropic_llms
 from . import huggingface
+from . import megatronlm
 from . import textsynth
 from . import dummy
 
@@ -13,6 +14,7 @@
     "gpt2": gpt2.GPT2LM,
     "gpt3": gpt3.GPT3LM,
     "anthropic": anthropic_llms.AnthropicLM,
+    "megatronlm": megatronlm.MegatronServerLM,
     "textsynth": textsynth.TextSynthLM,
     "dummy": dummy.DummyLM,
 }