source: other-projects/maori-lang-detection/mongodb-data/1b_counts_noMiInUrlPath.json@ 33848

Last change on this file since 33848 was 33848, checked in by ak19, 4 years ago

Tables of mongodb counts (1-5 table) and manual counts (6table). GeoJSON maps for number of web PAGES in MRI and containing MRI.

File size: 2.2 KB
Line 
1/*
2All crawled sites which don't contain mi (mi.* or */mi) in the URL path.
3
4db.Websites.aggregate([
5 { $match: {urlContainsLangCodeInPath: false} },
6 { $unwind: "$geoLocationCountryCode" },
7 {
8 $group: {
9 _id: "$geoLocationCountryCode",
10 count: { $sum: 1 }
11 }
12 },
13 { $sort : { count : -1} }
14]);
15*/
16
17/* 1 */
18{
19 "_id" : "us",
20 "count" : 288.0
21}
22
23/* 2 */
24{
25 "_id" : "unknown",
26 "count" : 154.0
27}
28
29/* 3 */
30{
31 "_id" : "nz",
32 "count" : 101.0
33}
34
35/* 4 */
36{
37 "_id" : "de",
38 "count" : 40.0
39}
40
41/* 5 */
42{
43 "_id" : "au",
44 "count" : 36.0
45}
46
47/* 6 */
48{
49 "_id" : "fr",
50 "count" : 35.0
51}
52
53/* 7 */
54{
55 "_id" : "nl",
56 "count" : 24.0
57}
58
59/* 8 */
60{
61 "_id" : "gb",
62 "count" : 13.0
63}
64
65/* 9 */
66{
67 "_id" : "ca",
68 "count" : 12.0
69}
70
71/* 10 */
72{
73 "_id" : "dk",
74 "count" : 8.0
75}
76
77/* 11 */
78{
79 "_id" : "es",
80 "count" : 7.0
81}
82
83/* 12 */
84{
85 "_id" : "cz",
86 "count" : 6.0
87}
88
89/* 13 */
90{
91 "_id" : "jp",
92 "count" : 5.0
93}
94
95/* 14 */
96{
97 "_id" : "it",
98 "count" : 4.0
99}
100
101/* 15 */
102{
103 "_id" : "in",
104 "count" : 3.0
105}
106
107/* 16 */
108{
109 "_id" : "ie",
110 "count" : 3.0
111}
112
113/* 17 */
114{
115 "_id" : "at",
116 "count" : 3.0
117}
118
119/* 18 */
120{
121 "_id" : "ro",
122 "count" : 3.0
123}
124
125/* 19 */
126{
127 "_id" : "ru",
128 "count" : 3.0
129}
130
131/* 20 */
132{
133 "_id" : "se",
134 "count" : 3.0
135}
136
137/* 21 */
138{
139 "_id" : "ch",
140 "count" : 3.0
141}
142
143/* 22 */
144{
145 "_id" : "il",
146 "count" : 3.0
147}
148
149/* 23 */
150{
151 "_id" : "pl",
152 "count" : 2.0
153}
154
155/* 24 */
156{
157 "_id" : "ck",
158 "count" : 2.0
159}
160
161/* 25 */
162{
163 "_id" : "cn",
164 "count" : 2.0
165}
166
167/* 26 */
168{
169 "_id" : "sg",
170 "count" : 1.0
171}
172
173/* 27 */
174{
175 "_id" : "mx",
176 "count" : 1.0
177}
178
179/* 28 */
180{
181 "_id" : "io",
182 "count" : 1.0
183}
184
185/* 29 */
186{
187 "_id" : "za",
188 "count" : 1.0
189}
190
191/* 30 */
192{
193 "_id" : "ir",
194 "count" : 1.0
195}
196
197/* 31 */
198{
199 "_id" : "ua",
200 "count" : 1.0
201}
202
203/* 32 */
204{
205 "_id" : "bg",
206 "count" : 1.0
207}
208
209/* 33 */
210{
211 "_id" : "gr",
212 "count" : 1.0
213}
214
215/* 34 */
216{
217 "_id" : "fi",
218 "count" : 1.0
219}
220
221/* 35 */
222{
223 "_id" : "me",
224 "count" : 1.0
225}
226
227/* 36 */
228{
229 "_id" : "pf",
230 "count" : 1.0
231}
232
233/* 37 */
234{
235 "_id" : "pt",
236 "count" : 1.0
237}
238
Note: See TracBrowser for help on using the repository browser.