Skip to content

Commit

Permalink
feat: update model name format
Browse files Browse the repository at this point in the history
  • Loading branch information
soryxie committed Nov 17, 2023
1 parent b65cb25 commit de25ef3
Show file tree
Hide file tree
Showing 3 changed files with 78 additions and 82 deletions.
78 changes: 39 additions & 39 deletions humaneval.csv
Original file line number Diff line number Diff line change
@@ -1,39 +1,39 @@
Model,Size,pass@1,prompted
GPT-4 (May 2023),N/A,88.4,TRUE
WizardCoder-Python-34B-V1.0,34B,73.2,TRUE
ChatGPT (May 2023),N/A,73.2,TRUE
Phind-CodeLlama-34B-v2,34B,71.3,FALSE
DeepSeek-Coder,33B,51.2,FALSE
DeepSeek-Coder-instruct,33B,78.7,TRUE
DeepSeek-Coder,6.7B,47.6,FALSE
DeepSeek-Coder-instruct,6.7B,73.8,TRUE
DeepSeek-Coder-instruct,1.3B,64.6,TRUE
Mistral,7B,28.7,FALSE
Mistral-codealpaca,7B,48.2,FALSE
Zephyr β,7B,30,FALSE
StarCoder,15B,34.1,FALSE
StarCoder,1B,14.6,FALSE
StarCoder,3B,17.7,FALSE
StarCoder,7B,20.7,FALSE
CodeLlama,7B,37.8,FALSE
CodeLlama,13B,42.7,FALSE
CodeLlama,34B,51.8,FALSE
CodeT5+,2B,25,FALSE
CodeT5+,6B,29.3,FALSE
CodeT5+,16B,31.7,FALSE
CodeGen,2B,24.4,FALSE
CodeGen,6B,29.3,FALSE
CodeGen,16B,32.9,FALSE
CodeGen2,1B,11,FALSE
CodeGen2,3B,15.9,FALSE
CodeGen2,7B,18.3,FALSE
CodeGen2,16B,19.5,FALSE
Vicuna,7B,11.6,FALSE
Vicuna,13B,17.1,FALSE
SantaCoder,1.1B,14.6,FALSE
InCoder,1.3B,12.2,FALSE
InCoder,6.7B,15.9,FALSE
GPT-J,6B,12.2,FALSE
GPT-Neo,2.7B,7.9,FALSE
PolyCoder,2.7B,6.1,FALSE
StableLM,7B,2.4,FALSE
Model,pass@1,prompted
GPT-4 (May 2023),88.4,TRUE
WizardCoder-Python-34B-V1.0,73.2,TRUE
ChatGPT (May 2023),73.2,TRUE
Phind-CodeLlama-34B-v2,71.3,FALSE
DeepSeek-Coder-33B-base,51.2,FALSE
DeepSeek-Coder-33B-instruct,78.7,TRUE
DeepSeek-Coder-6.7B-base,47.6,FALSE
DeepSeek-Coder-6.7B-instruct,73.8,TRUE
DeepSeek-Coder-1.3B-instruct,64.6,TRUE
Mistral-7B,28.7,FALSE
Mistral-codealpaca-7B,48.2,FALSE
Zephyr β-7B,30,FALSE
StarCoder-15B,34.1,FALSE
StarCoder-1B,14.6,FALSE
StarCoder-3B,17.7,FALSE
StarCoder-7B,20.7,FALSE
CodeLlama-7B,37.8,FALSE
CodeLlama-13B,42.7,FALSE
CodeLlama-34B,51.8,FALSE
CodeT5+-2B,25,FALSE
CodeT5+-6B,29.3,FALSE
CodeT5+-16B,31.7,FALSE
CodeGen-2B,24.4,FALSE
CodeGen-6B,29.3,FALSE
CodeGen-16B,32.9,FALSE
CodeGen2-1B,11,FALSE
CodeGen2-3B,15.9,FALSE
CodeGen2-7B,18.3,FALSE
CodeGen2-16B,19.5,FALSE
Vicuna-7B,11.6,FALSE
Vicuna-13B,17.1,FALSE
SantaCoder-1.1B,14.6,FALSE
InCoder-1.3B,12.2,FALSE
InCoder-6.7B,15.9,FALSE
GPT-J-6B,12.2,FALSE
GPT-Neo-2.7B,7.9,FALSE
PolyCoder-2.7B,6.1,FALSE
StableLM-7B,2.4,FALSE
78 changes: 39 additions & 39 deletions humanevalplus.csv
Original file line number Diff line number Diff line change
@@ -1,39 +1,39 @@
Model,Size,pass@1,prompted
GPT-4 (May 2023),N/A,76.8,TRUE
WizardCoder-Python-34B-V1.0,34B,64.6,TRUE
ChatGPT (May 2023),N/A,64,TRUE
Phind-CodeLlama-34B-v2,34B,67.1,FALSE
DeepSeek-Coder,33B,43.3,FALSE
DeepSeek-Coder-instruct,33B,72.6,TRUE
DeepSeek-Coder,6.7B,39.6,FALSE
DeepSeek-Coder-instruct,6.7B,70.1,TRUE
DeepSeek-Coder-instruct,1.3B,58.5,TRUE
Mistral,7B,23.2,FALSE
Mistral-codealpaca,7B,40.9,FALSE
Zephyr β,7B,23.2,FALSE
StarCoder,15B,29.3,FALSE
StarCoder,1B,11,FALSE
StarCoder,3B,14.6,FALSE
StarCoder,7B,20.7,FALSE
CodeLlama,7B,34.1,FALSE
CodeLlama,13B,36.6,FALSE
CodeLlama,34B,42.7,FALSE
CodeT5+,2B,22,FALSE
CodeT5+,6B,23.8,FALSE
CodeT5+,16B,26.2,FALSE
CodeGen,2B,21.3,FALSE
CodeGen,6B,25.6,FALSE
CodeGen,16B,27.4,FALSE
CodeGen2,1B,9.1,FALSE
CodeGen2,3B,12.8,FALSE
CodeGen2,7B,16.5,FALSE
CodeGen2,16B,16.5,FALSE
Vicuna,7B,11,FALSE
Vicuna,13B,15.2,FALSE
SantaCoder,1.1B,12.8,FALSE
InCoder,1.3B,10.4,FALSE
InCoder,6.7B,12.2,FALSE
GPT-J,6B,10.4,FALSE
GPT-Neo,2.7B,6.7,FALSE
PolyCoder,2.7B,5.5,FALSE
StableLM,7B,2.4,FALSE
Model,pass@1,prompted
GPT-4 (May 2023),76.8,TRUE
WizardCoder-Python-34B-V1.0,64.6,TRUE
ChatGPT (May 2023),64,TRUE
Phind-CodeLlama-34B-v2,67.1,FALSE
DeepSeek-Coder-33B-base,43.3,FALSE
DeepSeek-Coder-33B-instruct,72.6,TRUE
DeepSeek-Coder-6.7B-base,39.6,FALSE
DeepSeek-Coder-6.7B-instruct,70.1,TRUE
DeepSeek-Coder-1.3B-instruct,58.5,TRUE
Mistral-7B,23.2,FALSE
Mistral-codealpaca-7B,40.9,FALSE
Zephyr β-7B,23.2,FALSE
StarCoder-15B,29.3,FALSE
StarCoder-1B,11,FALSE
StarCoder-3B,14.6,FALSE
StarCoder-7B,20.7,FALSE
CodeLlama-7B,34.1,FALSE
CodeLlama-13B,36.6,FALSE
CodeLlama-34B,42.7,FALSE
CodeT5+-2B,22,FALSE
CodeT5+-6B,23.8,FALSE
CodeT5+-16B,26.2,FALSE
CodeGen-2B,21.3,FALSE
CodeGen-6B,25.6,FALSE
CodeGen-16B,27.4,FALSE
CodeGen2-1B,9.1,FALSE
CodeGen2-3B,12.8,FALSE
CodeGen2-7B,16.5,FALSE
CodeGen2-16B,16.5,FALSE
Vicuna-7B,11,FALSE
Vicuna-13B,15.2,FALSE
SantaCoder-1.1B,12.8,FALSE
InCoder-1.3B,10.4,FALSE
InCoder-6.7B,12.2,FALSE
GPT-J-6B,10.4,FALSE
GPT-Neo-2.7B,6.7,FALSE
PolyCoder-2.7B,5.5,FALSE
StableLM-7B,2.4,FALSE
4 changes: 0 additions & 4 deletions leaderboard.html
Original file line number Diff line number Diff line change
Expand Up @@ -168,7 +168,6 @@ <h3>📝 Notes</h3>

const theaders = [
'Model',
'Size',
'pass@1',
]

Expand Down Expand Up @@ -252,9 +251,6 @@ <h3>📝 Notes</h3>
modelCell.appendChild(promptedSymbol);
}
dataRow.appendChild(modelCell);
var sizeCell = document.createElement('td');
sizeCell.textContent = row['Size'];
dataRow.appendChild(sizeCell);
var passCell = document.createElement('td');
if (table == originTable) {
passCell.classList.add('text-danger');
Expand Down

0 comments on commit de25ef3

Please sign in to comment.