tatsu-lab · YannDubs · May 29, 2024 · May 29, 2024
diff --git a/results/REBEL-Llama-3-8B-Instruct/model_outputs.json b/results/REBEL-Llama-3-8B-Instruct/model_outputs.json
diff --git a/results/REBEL-Llama-3-8B-Instruct/weighted_alpaca_eval_gpt4_turbo/annotations.json b/results/REBEL-Llama-3-8B-Instruct/weighted_alpaca_eval_gpt4_turbo/annotations.json
diff --git a/...lpaca_eval/leaderboards/data_AlpacaEval_2/weighted_alpaca_eval_gpt4_turbo_leaderboard.csv b/...lpaca_eval/leaderboards/data_AlpacaEval_2/weighted_alpaca_eval_gpt4_turbo_leaderboard.csv
@@ -25,6 +25,7 @@ gpt4_0613_verbose,23.237360043453418,1.283539505582624,171,630,4,805,21.49068322
 mistral-large-2402,21.43877598137888,1.2485232545097724,166,638,1,805,20.6832298136646,verified,1362,32.65207998531868,
 SPPO-Mistral7B-PairRM-ExPO,35.4431306716895,1.398130896602677,274,531,0,805,34.037267080745345,community,2288,31.822321960655582,
 Samba-CoE-v0.2-best-of-16,26.988254318335404,1.3189030000371738,201,601,3,805,25.15527950310559,community,1578,31.506544268148147,
+REBEL-Llama-3-8B-Instruct,34.30642383142354,1.3914900255573264,268,537,0,805,33.29192546583851,community,2372,31.404092262807236,
 Mixtral-8x22B-Instruct-v0.1,22.21017054750302,1.2780740057417268,174,628,3,805,21.801242236024844,verified,1445,30.878810294279383,
 SPPO-Mistral7B-PairRM,32.2453123637764,1.3908000109577154,249,556,0,805,30.93167701863354,community,2114,30.494137965217423,
 claude-2.1_verbose,24.35407109006212,1.293586209982439,191,613,1,805,23.7888198757764,dev,1414,30.29117916664986,

diff --git a/...ights/weighted_alpaca_eval_gpt4_turbo/length_controlled_v1/baseline_gpt4_1106_preview.csv b/...ights/weighted_alpaca_eval_gpt4_turbo/length_controlled_v1/baseline_gpt4_1106_preview.csv
@@ -159,4 +159,5 @@ tulu-2-dpo-70b-ExPO,-1.2584665006823457,0.4518829275713181,-1.1294862478814247
 yi-large-preview,-1.4636444959266164,0.8454473244820504,0.2120258323902696
 gpt-4o-2024-05-13,-1.3858817861289865,0.7970841059254113,0.4815647498440927
 Llama-3-Instruct-8B-SimPO,-1.1683481185229099,0.8865274658510417,-0.1621386599809119
-vicuna-13b-v1.5-togetherai,-1.9474349738548216,1.0839122246708195,-2.8324894690247078
+vicuna-13b-v1.5-togetherai,-1.9474349738548216,1.0839122246708195,-2.8324894690247078
+REBEL-Llama-3-8B-Instruct,-1.6115180568772831,0.8439736002467700,-0.9158491151077486
diff --git a/src/alpaca_eval/models_configs/REBEL-Llama-3-8B-Instruct/configs.yaml b/src/alpaca_eval/models_configs/REBEL-Llama-3-8B-Instruct/configs.yaml
@@ -0,0 +1,15 @@
+REBEL-Llama-3-8B-Instruct:  # entry name; matches the results/ directory and leaderboard CSV rows
+  prompt_template: "REBEL-Llama-3-8B-Instruct/prompt.txt"  # template containing the {instruction} placeholder
+  fn_completions: "huggingface_local_completions"  # presumably runs the model locally via transformers; confirm
+  completions_kwargs:
+    model_name: "Cornell-AGI/REBEL-Llama-3"  # same Hugging Face repo as `link` below
+    model_kwargs:
+      torch_dtype: "bfloat16"
+    max_new_tokens: 4096
+    temperature: 0.6
+    top_p: 0.9
+    do_sample: true  # enable sampling rather than greedy decoding
+    batch_size: 16
+    eos_token_id: 128009  # presumably the id of <|eot_id|>, which ends each turn in prompt.txt; confirm against the tokenizer
+  pretty_name: "REBEL-Llama-3-8B-Instruct"
+  link: "https://huggingface.co/Cornell-AGI/REBEL-Llama-3"
diff --git a/src/alpaca_eval/models_configs/REBEL-Llama-3-8B-Instruct/prompt.txt b/src/alpaca_eval/models_configs/REBEL-Llama-3-8B-Instruct/prompt.txt
@@ -0,0 +1,4 @@
+<|start_header_id|>user<|end_header_id|>
+
+{instruction}<|eot_id|><|start_header_id|>assistant<|end_header_id|>
+
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1,4 @@
		<|start_header_id|>user<|end_header_id|>

		{instruction}<|eot_id|><|start_header_id|>assistant<|end_header_id|>