Muennighoff committed on
Commit
15cd90d
1 Parent(s): 87bb18f

Update code_eval_octopack.py

Browse files
Files changed (1) hide show
  1. code_eval_octopack.py +9 -31
code_eval_octopack.py CHANGED
@@ -11,10 +11,8 @@
11
  # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
  # See the License for the specific language governing permissions and
13
  # limitations under the License.
14
- """The CodeEval metric estimates the pass@k metric for code synthesis.
15
- This is an evaluation harness for the HumanEval problem solving dataset
16
- described in the paper "Evaluating Large Language Models Trained on Code"
17
- (https://arxiv.org/abs/2107.03374)."""
18
 
19
  import itertools
20
  import os
@@ -30,35 +28,17 @@ from .execute import check_correctness
30
 
31
 
32
  _CITATION = """\
33
- @misc{chen2021evaluating,
34
- title={Evaluating Large Language Models Trained on Code},
35
- author={Mark Chen and Jerry Tworek and Heewoo Jun and Qiming Yuan \
36
- and Henrique Ponde de Oliveira Pinto and Jared Kaplan and Harri Edwards \
37
- and Yuri Burda and Nicholas Joseph and Greg Brockman and Alex Ray \
38
- and Raul Puri and Gretchen Krueger and Michael Petrov and Heidy Khlaaf \
39
- and Girish Sastry and Pamela Mishkin and Brooke Chan and Scott Gray \
40
- and Nick Ryder and Mikhail Pavlov and Alethea Power and Lukasz Kaiser \
41
- and Mohammad Bavarian and Clemens Winter and Philippe Tillet \
42
- and Felipe Petroski Such and Dave Cummings and Matthias Plappert \
43
- and Fotios Chantzis and Elizabeth Barnes and Ariel Herbert-Voss \
44
- and William Hebgen Guss and Alex Nichol and Alex Paino and Nikolas Tezak \
45
- and Jie Tang and Igor Babuschkin and Suchir Balaji and Shantanu Jain \
46
- and William Saunders and Christopher Hesse and Andrew N. Carr \
47
- and Jan Leike and Josh Achiam and Vedant Misra and Evan Morikawa \
48
- and Alec Radford and Matthew Knight and Miles Brundage and Mira Murati \
49
- and Katie Mayer and Peter Welinder and Bob McGrew and Dario Amodei \
50
- and Sam McCandlish and Ilya Sutskever and Wojciech Zaremba},
51
- year={2021},
52
- eprint={2107.03374},
53
- archivePrefix={arXiv},
54
- primaryClass={cs.LG}
55
  }
56
  """
57
 
58
  _DESCRIPTION = """\
59
- This metric implements the evaluation harness for the HumanEval problem solving dataset
60
- described in the paper "Evaluating Large Language Models Trained on Code"
61
- (https://arxiv.org/abs/2107.03374).
62
  """
63
 
64
 
@@ -110,8 +90,6 @@ with:
110
 
111
  _LICENSE = """The MIT License
112
 
113
- Copyright (c) OpenAI (https://openai.com)
114
-
115
  Permission is hereby granted, free of charge, to any person obtaining a copy
116
  of this software and associated documentation files (the "Software"), to deal
117
  in the Software without restriction, including without limitation the rights
 
11
  # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
  # See the License for the specific language governing permissions and
13
  # limitations under the License.
14
+ """This metric implements code evaluation with execution across multiple languages as used in the paper
15
+ "OctoPack: Instruction Tuning Code Large Language Models" (https://arxiv.org/abs/2308.07124)."""
 
 
16
 
17
  import itertools
18
  import os
 
28
 
29
 
30
  _CITATION = """\
31
+ @article{muennighoff2023octopack,
32
+ title={OctoPack: Instruction Tuning Code Large Language Models},
33
+ author={Niklas Muennighoff and Qian Liu and Armel Zebaze and Qinkai Zheng and Binyuan Hui and Terry Yue Zhuo and Swayam Singh and Xiangru Tang and Leandro von Werra and Shayne Longpre},
34
+ journal={arXiv preprint arXiv:2308.07124},
35
+ year={2023}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
36
  }
37
  """
38
 
39
  _DESCRIPTION = """\
40
+ This metric implements code evaluation with execution across multiple languages as used in the paper
41
+ "OctoPack: Instruction Tuning Code Large Language Models" (https://arxiv.org/abs/2308.07124).
 
42
  """
43
 
44
 
 
90
 
91
  _LICENSE = """The MIT License
92
 
 
 
93
  Permission is hereby granted, free of charge, to any person obtaining a copy
94
  of this software and associated documentation files (the "Software"), to deal
95
  in the Software without restriction, including without limitation the rights