Spaces:
Sleeping
Sleeping
Add results
Browse files- evaluate.py +0 -1
- results.json +411 -0
evaluate.py
CHANGED
|
@@ -3,7 +3,6 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
|
|
| 3 |
from distributed_training.data.dataset import DataLoader
|
| 4 |
import random
|
| 5 |
from huggingface_hub import list_repo_refs
|
| 6 |
-
import matplotlib.pyplot as plt
|
| 7 |
import json
|
| 8 |
|
| 9 |
device = "cuda"
|
|
|
|
| 3 |
from distributed_training.data.dataset import DataLoader
|
| 4 |
import random
|
| 5 |
from huggingface_hub import list_repo_refs
|
|
|
|
| 6 |
import json
|
| 7 |
|
| 8 |
device = "cuda"
|
results.json
CHANGED
|
@@ -728,6 +728,417 @@
|
|
| 728 |
],
|
| 729 |
"242": [
|
| 730 |
8.73171443939209
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 731 |
]
|
| 732 |
},
|
| 733 |
"distributed/optimized-gpt2-250m-v0.1.1": {
|
|
|
|
| 728 |
],
|
| 729 |
"242": [
|
| 730 |
8.73171443939209
|
| 731 |
+
],
|
| 732 |
+
"243": [
|
| 733 |
+
8.572042465209961
|
| 734 |
+
],
|
| 735 |
+
"244": [
|
| 736 |
+
8.52768349647522
|
| 737 |
+
],
|
| 738 |
+
"245": [
|
| 739 |
+
8.435112762451173
|
| 740 |
+
],
|
| 741 |
+
"246": [
|
| 742 |
+
8.460542488098145
|
| 743 |
+
],
|
| 744 |
+
"247": [
|
| 745 |
+
8.261814832687378
|
| 746 |
+
],
|
| 747 |
+
"248": [
|
| 748 |
+
8.407774209976196
|
| 749 |
+
],
|
| 750 |
+
"249": [
|
| 751 |
+
8.373166799545288
|
| 752 |
+
],
|
| 753 |
+
"250": [
|
| 754 |
+
8.596418190002442
|
| 755 |
+
],
|
| 756 |
+
"251": [
|
| 757 |
+
8.347005526224772
|
| 758 |
+
],
|
| 759 |
+
"252": [
|
| 760 |
+
8.623340606689453
|
| 761 |
+
],
|
| 762 |
+
"253": [
|
| 763 |
+
8.539211511611938
|
| 764 |
+
],
|
| 765 |
+
"254": [
|
| 766 |
+
8.133444905281067
|
| 767 |
+
],
|
| 768 |
+
"255": [
|
| 769 |
+
8.684558550516764
|
| 770 |
+
],
|
| 771 |
+
"256": [
|
| 772 |
+
8.315968036651611
|
| 773 |
+
],
|
| 774 |
+
"257": [
|
| 775 |
+
8.38200600941976
|
| 776 |
+
],
|
| 777 |
+
"258": [
|
| 778 |
+
8.383176326751709
|
| 779 |
+
],
|
| 780 |
+
"259": [
|
| 781 |
+
8.400863075256348
|
| 782 |
+
],
|
| 783 |
+
"260": [
|
| 784 |
+
8.305717786153158
|
| 785 |
+
],
|
| 786 |
+
"261": [
|
| 787 |
+
8.545314598083497
|
| 788 |
+
],
|
| 789 |
+
"262": [
|
| 790 |
+
8.483990287780761
|
| 791 |
+
],
|
| 792 |
+
"263": [
|
| 793 |
+
8.214628791809082
|
| 794 |
+
],
|
| 795 |
+
"264": [
|
| 796 |
+
8.310606002807617
|
| 797 |
+
],
|
| 798 |
+
"265": [
|
| 799 |
+
8.100543403625489
|
| 800 |
+
],
|
| 801 |
+
"266": [
|
| 802 |
+
8.234585952758788
|
| 803 |
+
],
|
| 804 |
+
"267": [
|
| 805 |
+
8.491876983642578
|
| 806 |
+
],
|
| 807 |
+
"268": [
|
| 808 |
+
8.587455749511719
|
| 809 |
+
],
|
| 810 |
+
"269": [
|
| 811 |
+
8.082306098937988
|
| 812 |
+
],
|
| 813 |
+
"270": [
|
| 814 |
+
8.348917007446289
|
| 815 |
+
],
|
| 816 |
+
"271": [
|
| 817 |
+
8.372463989257813
|
| 818 |
+
],
|
| 819 |
+
"272": [
|
| 820 |
+
8.237805128097534
|
| 821 |
+
],
|
| 822 |
+
"273": [
|
| 823 |
+
8.354072761535644
|
| 824 |
+
],
|
| 825 |
+
"274": [
|
| 826 |
+
8.235678354899088
|
| 827 |
+
],
|
| 828 |
+
"275": [
|
| 829 |
+
8.407945315043131
|
| 830 |
+
],
|
| 831 |
+
"276": [
|
| 832 |
+
8.404786944389343
|
| 833 |
+
],
|
| 834 |
+
"277": [
|
| 835 |
+
8.70421314239502
|
| 836 |
+
],
|
| 837 |
+
"278": [
|
| 838 |
+
8.071562131245932
|
| 839 |
+
],
|
| 840 |
+
"279": [
|
| 841 |
+
8.511271953582764
|
| 842 |
+
],
|
| 843 |
+
"280": [
|
| 844 |
+
8.091069221496582
|
| 845 |
+
],
|
| 846 |
+
"281": [
|
| 847 |
+
8.105241934458414
|
| 848 |
+
],
|
| 849 |
+
"282": [
|
| 850 |
+
8.074981212615967
|
| 851 |
+
],
|
| 852 |
+
"283": [
|
| 853 |
+
8.298959159851075
|
| 854 |
+
],
|
| 855 |
+
"284": [
|
| 856 |
+
8.066243092219034
|
| 857 |
+
],
|
| 858 |
+
"285": [
|
| 859 |
+
8.178271770477295
|
| 860 |
+
],
|
| 861 |
+
"286": [
|
| 862 |
+
8.293231010437012
|
| 863 |
+
],
|
| 864 |
+
"287": [
|
| 865 |
+
8.43751049041748
|
| 866 |
+
],
|
| 867 |
+
"288": [
|
| 868 |
+
8.105303128560385
|
| 869 |
+
],
|
| 870 |
+
"289": [
|
| 871 |
+
8.421969032287597
|
| 872 |
+
],
|
| 873 |
+
"290": [
|
| 874 |
+
8.30833911895752
|
| 875 |
+
],
|
| 876 |
+
"291": [
|
| 877 |
+
8.0765008131663
|
| 878 |
+
],
|
| 879 |
+
"292": [
|
| 880 |
+
8.021388053894043
|
| 881 |
+
],
|
| 882 |
+
"293": [
|
| 883 |
+
8.335704485575357
|
| 884 |
+
],
|
| 885 |
+
"294": [
|
| 886 |
+
8.045191287994385
|
| 887 |
+
],
|
| 888 |
+
"295": [
|
| 889 |
+
7.93108606338501
|
| 890 |
+
],
|
| 891 |
+
"296": [
|
| 892 |
+
7.992374897003174
|
| 893 |
+
],
|
| 894 |
+
"297": [
|
| 895 |
+
8.036834875742594
|
| 896 |
+
],
|
| 897 |
+
"298": [
|
| 898 |
+
7.984613704681396
|
| 899 |
+
],
|
| 900 |
+
"299": [
|
| 901 |
+
7.9923395156860355
|
| 902 |
+
],
|
| 903 |
+
"300": [
|
| 904 |
+
8.048283497492472
|
| 905 |
+
],
|
| 906 |
+
"301": [
|
| 907 |
+
8.485947370529175
|
| 908 |
+
],
|
| 909 |
+
"302": [
|
| 910 |
+
8.025302092234293
|
| 911 |
+
],
|
| 912 |
+
"303": [
|
| 913 |
+
7.875656485557556
|
| 914 |
+
],
|
| 915 |
+
"304": [
|
| 916 |
+
8.240285038948059
|
| 917 |
+
],
|
| 918 |
+
"305": [
|
| 919 |
+
8.169192552566528
|
| 920 |
+
],
|
| 921 |
+
"306": [
|
| 922 |
+
8.01096134185791
|
| 923 |
+
],
|
| 924 |
+
"307": [
|
| 925 |
+
7.814367453257243
|
| 926 |
+
],
|
| 927 |
+
"308": [
|
| 928 |
+
8.359534621238708
|
| 929 |
+
],
|
| 930 |
+
"309": [
|
| 931 |
+
8.128613948822021
|
| 932 |
+
],
|
| 933 |
+
"310": [
|
| 934 |
+
8.132676696777343
|
| 935 |
+
],
|
| 936 |
+
"311": [
|
| 937 |
+
7.703763484954834
|
| 938 |
+
],
|
| 939 |
+
"312": [
|
| 940 |
+
7.964991569519043
|
| 941 |
+
],
|
| 942 |
+
"313": [
|
| 943 |
+
8.09695291519165
|
| 944 |
+
],
|
| 945 |
+
"314": [
|
| 946 |
+
7.946078491210938
|
| 947 |
+
],
|
| 948 |
+
"315": [
|
| 949 |
+
7.795873982565744
|
| 950 |
+
],
|
| 951 |
+
"316": [
|
| 952 |
+
8.114620049794516
|
| 953 |
+
],
|
| 954 |
+
"317": [
|
| 955 |
+
7.781284264155796
|
| 956 |
+
],
|
| 957 |
+
"318": [
|
| 958 |
+
8.108832359313965
|
| 959 |
+
],
|
| 960 |
+
"319": [
|
| 961 |
+
8.14557377497355
|
| 962 |
+
],
|
| 963 |
+
"320": [
|
| 964 |
+
8.058723449707031
|
| 965 |
+
],
|
| 966 |
+
"321": [
|
| 967 |
+
8.213569736480713
|
| 968 |
+
],
|
| 969 |
+
"322": [
|
| 970 |
+
7.698760986328125
|
| 971 |
+
],
|
| 972 |
+
"323": [
|
| 973 |
+
7.998951315879822
|
| 974 |
+
],
|
| 975 |
+
"324": [
|
| 976 |
+
7.742861986160278
|
| 977 |
+
],
|
| 978 |
+
"325": [
|
| 979 |
+
7.954373073577881
|
| 980 |
+
],
|
| 981 |
+
"326": [
|
| 982 |
+
7.918167591094971
|
| 983 |
+
],
|
| 984 |
+
"327": [
|
| 985 |
+
8.006525897979737
|
| 986 |
+
],
|
| 987 |
+
"328": [
|
| 988 |
+
7.668278789520263
|
| 989 |
+
],
|
| 990 |
+
"329": [
|
| 991 |
+
8.08655297756195
|
| 992 |
+
],
|
| 993 |
+
"330": [
|
| 994 |
+
7.91127290725708
|
| 995 |
+
],
|
| 996 |
+
"331": [
|
| 997 |
+
7.696333885192871
|
| 998 |
+
],
|
| 999 |
+
"332": [
|
| 1000 |
+
7.65695583820343
|
| 1001 |
+
],
|
| 1002 |
+
"333": [
|
| 1003 |
+
8.066210746765137
|
| 1004 |
+
],
|
| 1005 |
+
"334": [
|
| 1006 |
+
7.964347243309021
|
| 1007 |
+
],
|
| 1008 |
+
"335": [
|
| 1009 |
+
7.954415321350098
|
| 1010 |
+
],
|
| 1011 |
+
"336": [
|
| 1012 |
+
7.868668556213379
|
| 1013 |
+
],
|
| 1014 |
+
"337": [
|
| 1015 |
+
7.752981662750244
|
| 1016 |
+
],
|
| 1017 |
+
"338": [
|
| 1018 |
+
7.988874117533366
|
| 1019 |
+
],
|
| 1020 |
+
"339": [
|
| 1021 |
+
7.646774482727051
|
| 1022 |
+
],
|
| 1023 |
+
"340": [
|
| 1024 |
+
7.754316425323486
|
| 1025 |
+
],
|
| 1026 |
+
"341": [
|
| 1027 |
+
7.727629899978638
|
| 1028 |
+
],
|
| 1029 |
+
"342": [
|
| 1030 |
+
8.081591129302979
|
| 1031 |
+
],
|
| 1032 |
+
"343": [
|
| 1033 |
+
8.093174934387207
|
| 1034 |
+
],
|
| 1035 |
+
"344": [
|
| 1036 |
+
7.799541187286377
|
| 1037 |
+
],
|
| 1038 |
+
"345": [
|
| 1039 |
+
7.860105419158936
|
| 1040 |
+
],
|
| 1041 |
+
"346": [
|
| 1042 |
+
7.771262836456299
|
| 1043 |
+
],
|
| 1044 |
+
"347": [
|
| 1045 |
+
7.807041168212891
|
| 1046 |
+
],
|
| 1047 |
+
"348": [
|
| 1048 |
+
7.724535584449768
|
| 1049 |
+
],
|
| 1050 |
+
"349": [
|
| 1051 |
+
7.576266288757324
|
| 1052 |
+
],
|
| 1053 |
+
"350": [
|
| 1054 |
+
7.5733345576695035
|
| 1055 |
+
],
|
| 1056 |
+
"351": [
|
| 1057 |
+
7.8062320947647095
|
| 1058 |
+
],
|
| 1059 |
+
"352": [
|
| 1060 |
+
7.669395923614502
|
| 1061 |
+
],
|
| 1062 |
+
"353": [
|
| 1063 |
+
7.868735027313233
|
| 1064 |
+
],
|
| 1065 |
+
"354": [
|
| 1066 |
+
7.829128563404083
|
| 1067 |
+
],
|
| 1068 |
+
"355": [
|
| 1069 |
+
7.602943658828735
|
| 1070 |
+
],
|
| 1071 |
+
"356": [
|
| 1072 |
+
7.92758321762085
|
| 1073 |
+
],
|
| 1074 |
+
"357": [
|
| 1075 |
+
7.628891547520955
|
| 1076 |
+
],
|
| 1077 |
+
"358": [
|
| 1078 |
+
8.02551555633545
|
| 1079 |
+
],
|
| 1080 |
+
"359": [
|
| 1081 |
+
7.746890226999919
|
| 1082 |
+
],
|
| 1083 |
+
"360": [
|
| 1084 |
+
7.8968634605407715
|
| 1085 |
+
],
|
| 1086 |
+
"361": [
|
| 1087 |
+
7.753103494644165
|
| 1088 |
+
],
|
| 1089 |
+
"362": [
|
| 1090 |
+
7.334808553968157
|
| 1091 |
+
],
|
| 1092 |
+
"363": [
|
| 1093 |
+
7.754158973693848
|
| 1094 |
+
],
|
| 1095 |
+
"364": [
|
| 1096 |
+
7.697373867034912
|
| 1097 |
+
],
|
| 1098 |
+
"365": [
|
| 1099 |
+
7.373909632364909
|
| 1100 |
+
],
|
| 1101 |
+
"366": [
|
| 1102 |
+
7.343849062919617
|
| 1103 |
+
],
|
| 1104 |
+
"367": [
|
| 1105 |
+
8.091873486836752
|
| 1106 |
+
],
|
| 1107 |
+
"368": [
|
| 1108 |
+
7.612311840057373
|
| 1109 |
+
],
|
| 1110 |
+
"369": [
|
| 1111 |
+
7.7113198439280195
|
| 1112 |
+
],
|
| 1113 |
+
"370": [
|
| 1114 |
+
7.706414580345154
|
| 1115 |
+
],
|
| 1116 |
+
"371": [
|
| 1117 |
+
7.664455056190491
|
| 1118 |
+
],
|
| 1119 |
+
"372": [
|
| 1120 |
+
7.630658054351807
|
| 1121 |
+
],
|
| 1122 |
+
"373": [
|
| 1123 |
+
7.412530779838562
|
| 1124 |
+
],
|
| 1125 |
+
"374": [
|
| 1126 |
+
7.605931639671326
|
| 1127 |
+
],
|
| 1128 |
+
"375": [
|
| 1129 |
+
8.049162983894348
|
| 1130 |
+
],
|
| 1131 |
+
"376": [
|
| 1132 |
+
7.7938069105148315
|
| 1133 |
+
],
|
| 1134 |
+
"377": [
|
| 1135 |
+
7.814945062001546
|
| 1136 |
+
],
|
| 1137 |
+
"378": [
|
| 1138 |
+
7.6603734493255615
|
| 1139 |
+
],
|
| 1140 |
+
"379": [
|
| 1141 |
+
7.516097784042358
|
| 1142 |
]
|
| 1143 |
},
|
| 1144 |
"distributed/optimized-gpt2-250m-v0.1.1": {
|