1
1
{
2
- "dialects" : {
3
- "url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/dialects.zip" ,
4
- "signature" : " 0e6767047e05f618560d097dfa0587530636c52fc19507c087bdff556b389489"
2
+ "aegis-sample" : {
3
+ "url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/aegis-sample.zip" ,
4
+ "signature" : " a2b3ae9c5a19833cc594fc4c14a6bfce35ab9c6086f0c2836d2719ab788119bd" ,
5
+ "size" : {
6
+ "compressed" : 916334 ,
7
+ "decompressed" : 2878359
8
+ },
9
+ "instances" : 3030
5
10
},
6
- "lowlight" : {
7
- "url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/lowlight.zip" ,
8
- "signature" : " ddc36eb7f0443efa5e71939e503d0834fd48451281d9658d5cb7ead30143b98f"
11
+ "aegis" : {
12
+ "url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/aegis.zip" ,
13
+ "signature" : " c846f20d893461525839cd2f61f85faf0dcbff03e1998fd8f747506ff65bec69" ,
14
+ "size" : {
15
+ "compressed" : 3619910 ,
16
+ "decompressed" : 11362916
17
+ },
18
+ "instances" : 11997
9
19
},
10
20
"dialects-sample" : {
11
21
"url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/dialects-sample.zip" ,
12
- "signature" : " 9e9509f4d82468c896bede36b16c6de218a1dce28a56ae49d1fb75933bf770c5"
13
- },
14
- "reddit" : {
15
- "url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/reddit.zip" ,
16
- "signature" : " d97419403f0d940970b2542d5b188570dacedae3c2a68ada3520cfa95c52f75c"
22
+ "signature" : " 9e9509f4d82468c896bede36b16c6de218a1dce28a56ae49d1fb75933bf770c5" ,
23
+ "size" : {
24
+ "compressed" : 243136640 ,
25
+ "decompressed" : 356704802
26
+ },
27
+ "instances" : 1785 ,
28
+ "classes" : {
29
+ "northern_male" : 203 ,
30
+ "southern_female" : 417 ,
31
+ "northern_female" : 65 ,
32
+ "irish_male" : 48 ,
33
+ "scottish_male" : 172 ,
34
+ "welsh_female" : 120 ,
35
+ "southern_male" : 436 ,
36
+ "midlands_female" : 24 ,
37
+ "midlands_male" : 51 ,
38
+ "welsh_male" : 157 ,
39
+ "scottish_female" : 92
40
+ }
17
41
},
18
- "movies-sample" : {
19
- "url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/movies-sample.zip" ,
20
- "signature" : " 2d3d9294ad875e7489db94fc2ab02c1ad6dfdc15a2bf1a5037be36a6defc8168"
42
+ "dialects" : {
43
+ "url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/dialects.zip" ,
44
+ "signature" : " 0e6767047e05f618560d097dfa0587530636c52fc19507c087bdff556b389489" ,
45
+ "size" : {
46
+ "compressed" : 2466918919 ,
47
+ "decompressed" : 3605272328
48
+ },
49
+ "instances" : 17877 ,
50
+ "classes" : {
51
+ "northern_male" : 2097 ,
52
+ "southern_female" : 4161 ,
53
+ "northern_female" : 750 ,
54
+ "irish_male" : 450 ,
55
+ "scottish_male" : 1649 ,
56
+ "welsh_female" : 1199 ,
57
+ "southern_male" : 4331 ,
58
+ "midlands_female" : 246 ,
59
+ "midlands_male" : 450 ,
60
+ "welsh_male" : 1650 ,
61
+ "scottish_female" : 894
62
+ }
21
63
},
22
64
"essays-sample" : {
23
65
"url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/essays-sample.zip" ,
24
- "signature" : " a77fc1c2c2718d79132598e6c873fd5b08c40c2e4049d995317747fb76b96631"
25
- },
26
- "aegis-sample" : {
27
- "url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/aegis-sample.zip" ,
28
- "signature" : " a2b3ae9c5a19833cc594fc4c14a6bfce35ab9c6086f0c2836d2719ab788119bd"
29
- },
30
- "aegis" : {
31
- "url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/aegis.zip" ,
32
- "signature" : " c846f20d893461525839cd2f61f85faf0dcbff03e1998fd8f747506ff65bec69"
33
- },
34
- "nsfw-sample" : {
35
- "url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/nsfw-sample.zip" ,
36
- "signature" : " d5044f30769d3a6e9ba639312120dc955bdfcf4d8aa8a6f3ee493334644b9fcd"
66
+ "signature" : " a77fc1c2c2718d79132598e6c873fd5b08c40c2e4049d995317747fb76b96631" ,
67
+ "size" : {
68
+ "compressed" : 1796330 ,
69
+ "decompressed" : 8785856
70
+ },
71
+ "instances" : 512
37
72
},
38
73
"essays" : {
39
74
"url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/essays.zip" ,
40
- "signature" : " 3a7b260dd5baec9134c7398ac7b9b297d7b1a387bce1a9f99cd8d3e0a7ceb9cc"
41
- },
42
- "reddit-sample" : {
43
- "url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/reddit-sample.zip" ,
44
- "signature" : " 24088c648b8c3497d0b682102c3fa965d46ca22abe8f94695287e09bf82db991"
75
+ "signature" : " 3a7b260dd5baec9134c7398ac7b9b297d7b1a387bce1a9f99cd8d3e0a7ceb9cc" ,
76
+ "size" : {
77
+ "compressed" : 7116584 ,
78
+ "decompressed" : 35516576
79
+ },
80
+ "instances" : 2078
45
81
},
46
82
"lowlight-sample" : {
47
83
"url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/lowlight-sample.zip" ,
48
- "signature" : " f34bafa588441b8e240b0932e9ac446d9f805bdfdb22640c036c441258220eaf"
84
+ "signature" : " f34bafa588441b8e240b0932e9ac446d9f805bdfdb22640c036c441258220eaf" ,
85
+ "size" : {
86
+ "compressed" : 166217847 ,
87
+ "decompressed" : 166608858
88
+ },
89
+ "instances" : 475 ,
90
+ "classes" : {
91
+ "high" : 242 ,
92
+ "low" : 233
93
+ }
94
+ },
95
+ "lowlight" : {
96
+ "url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/lowlight.zip" ,
97
+ "signature" : " ddc36eb7f0443efa5e71939e503d0834fd48451281d9658d5cb7ead30143b98f" ,
98
+ "size" : {
99
+ "compressed" : 347470078 ,
100
+ "decompressed" : 348256471
101
+ },
102
+ "instances" : 1000 ,
103
+ "classes" : {
104
+ "high" : 500 ,
105
+ "low" : 500
106
+ }
107
+ },
108
+ "movies-sample" : {
109
+ "url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/movies-sample.zip" ,
110
+ "signature" : " 2d3d9294ad875e7489db94fc2ab02c1ad6dfdc15a2bf1a5037be36a6defc8168" ,
111
+ "size" : {
112
+ "compressed" : 381174092 ,
113
+ "decompressed" : 387776108
114
+ },
115
+ "instances" : 5465 ,
116
+ "classes" : {
117
+ "movies" : 5465
118
+ }
49
119
},
50
120
"movies" : {
51
121
"url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/movies.zip" ,
52
- "signature" : " 618f7aa8aa103192ee8b76fc701ff182b2a41e5e78675a4d6af707e490d36f45"
122
+ "signature" : " 618f7aa8aa103192ee8b76fc701ff182b2a41e5e78675a4d6af707e490d36f45" ,
123
+ "size" : {
124
+ "compressed" : 7351355869 ,
125
+ "decompressed" : 7479027563
126
+ },
127
+ "instances" : 106844 ,
128
+ "classes" : {
129
+ "movies" : 106844
130
+ }
131
+ },
132
+ "nsfw-sample" : {
133
+ "url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/nsfw-sample.zip" ,
134
+ "signature" : " d5044f30769d3a6e9ba639312120dc955bdfcf4d8aa8a6f3ee493334644b9fcd" ,
135
+ "size" : {
136
+ "compressed" : 6429140 ,
137
+ "decompressed" : 6535438
138
+ },
139
+ "instances" : 53 ,
140
+ "classes" : {
141
+ "safe" : 28 ,
142
+ "nsfw" : 25
143
+ }
53
144
},
54
145
"nsfw" : {
55
146
"url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/nsfw.zip" ,
56
- "signature" : " 7ac498e8f17428c51a5c8c366aaf10b47663a9eb8a560fd8abe01366eaf60139"
147
+ "signature" : " 7ac498e8f17428c51a5c8c366aaf10b47663a9eb8a560fd8abe01366eaf60139" ,
148
+ "size" : {
149
+ "compressed" : 27937058 ,
150
+ "decompressed" : 28266876
151
+ },
152
+ "instances" : 215 ,
153
+ "classes" : {
154
+ "safe" : 108 ,
155
+ "nsfw" : 107
156
+ }
157
+ },
158
+ "reddit-sample" : {
159
+ "url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/reddit-sample.zip" ,
160
+ "signature" : " 24088c648b8c3497d0b682102c3fa965d46ca22abe8f94695287e09bf82db991" ,
161
+ "size" : {
162
+ "compressed" : 63979 ,
163
+ "decompressed" : 278734
164
+ },
165
+ "instances" : 957
166
+ },
167
+ "reddit" : {
168
+ "url" : " https://storage.googleapis.com/construe/v0.3.0/datasets/reddit.zip" ,
169
+ "signature" : " d97419403f0d940970b2542d5b188570dacedae3c2a68ada3520cfa95c52f75c" ,
170
+ "size" : {
171
+ "compressed" : 244363 ,
172
+ "decompressed" : 1117785
173
+ },
174
+ "instances" : 3844
57
175
}
58
176
}
0 commit comments