JW17 committed on
Commit
e478343
·
verified ·
1 Parent(s): 440e7a8

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +3 -3
README.md CHANGED
@@ -17,7 +17,7 @@ model-index:
17
  metrics:
18
  - name: Win Rate
19
  type: AlpacaEval 1.0
20
- value: 87.92%
21
  source:
22
  name: self-reported
23
  url: https://github.com/tatsu-lab/alpaca_eval
@@ -29,7 +29,7 @@ model-index:
29
  metrics:
30
  - name: Win Rate
31
  type: AlpacaEval 2.0
32
- value: 11.33%
33
  source:
34
  name: self-reported
35
  url: https://github.com/tatsu-lab/alpaca_eval
@@ -41,7 +41,7 @@ model-index:
41
  metrics:
42
  - name: Score
43
  type: MT-Bench
44
- value: 7.23
45
  source:
46
  name: self-reported
47
  url: https://github.com/lm-sys/FastChat/blob/main/fastchat/llm_judge/
 
17
  metrics:
18
  - name: Win Rate
19
  type: AlpacaEval 1.0
20
+ value: 91.41%
21
  source:
22
  name: self-reported
23
  url: https://github.com/tatsu-lab/alpaca_eval
 
29
  metrics:
30
  - name: Win Rate
31
  type: AlpacaEval 2.0
32
+ value: 12.20%
33
  source:
34
  name: self-reported
35
  url: https://github.com/tatsu-lab/alpaca_eval
 
41
  metrics:
42
  - name: Score
43
  type: MT-Bench
44
+ value: 7.32
45
  source:
46
  name: self-reported
47
  url: https://github.com/lm-sys/FastChat/blob/main/fastchat/llm_judge/