Ignore:
Timestamp:
2019-12-18T21:38:44+13:00 (4 years ago)
Author:
ak19
Message:

Following yesterday's bugfix, the inclusion of http(s)://mi.* type URLs when setting the urlContainsLangCodeInPath property of the Websites mongodb collection, and the updated/improved mongodb queries and their results, I have now regenerated the latest geojson json data and maps.

File:
1 edited

Legend:

Unmodified
Added
Removed
  • other-projects/maori-lang-detection/mongodb-data/counts_sitesWithPagesInMRI.json

    r33805 r33813  
     1/*
     2Number of websites that have 1 or more pages detected as being in Maori, a positive numPagesInMRI.
     3
     4db.getCollection('Websites').find({numPagesInMRI: { $gt: 0}}).count()
     5= 361
     6
     7Count of country codes for sites that have at least one page detected as MRI:
     8
     9db.Websites.aggregate([
     10    {
     11        $match: {
     12            numPagesInMRI: {$gt: 0}
     13        }
     14    },
     15    { $unwind: "$geoLocationCountryCode" },
     16    {
     17        $group: {
     18            _id: {$toLower: '$geoLocationCountryCode'},
     19            count: { $sum: 1 }
     20        }
     21    },
     22    { $sort : { count : -1} }
     23]);
     24*/
     25
    126/* 1 */
    227{
    328    "_id" : "us",
    4     "count" : 207.0
     29    "count" : 206.0
    530}
    631
     
    4974/* 9 */
    5075{
    51     "_id" : "ca",
    52     "count" : 4.0
     76    "_id" : "gb",
     77    "count" : 3.0
    5378}
    5479
    5580/* 10 */
    5681{
    57     "_id" : "gb",
     82    "_id" : "ca",
    5883    "count" : 3.0
    5984}
     
    6186/* 11 */
    6287{
    63     "_id" : "ie",
     88    "_id" : "ua",
    6489    "count" : 2.0
    6590}
     
    6792/* 12 */
    6893{
    69     "_id" : "ua",
     94    "_id" : "ie",
    7095    "count" : 2.0
    7196}
     
    80105{
    81106    "_id" : "sg",
     107    "count" : 2.0
     108}
     109
     110/* 15 */
     111{
     112    "_id" : "unknown",
     113    "count" : 2.0
     114}
     115
     116/* 16 */
     117{
     118    "_id" : "gr",
    82119    "count" : 1.0
    83120}
    84121
    85 /* 15 */
     122/* 17 */
     123{
     124    "_id" : "hk",
     125    "count" : 1.0
     126}
     127
     128/* 18 */
     129{
     130    "_id" : "jp",
     131    "count" : 1.0
     132}
     133
     134/* 19 */
     135{
     136    "_id" : "bg",
     137    "count" : 1.0
     138}
     139
     140/* 20 */
    86141{
    87142    "_id" : "mx",
     
    89144}
    90145
    91 /* 16 */
     146/* 21 */
    92147{
    93     "_id" : "hk",
     148    "_id" : "ro",
    94149    "count" : 1.0
    95150}
    96 
    97 /* 17 */
    98 {
    99     "_id" : "jp",
    100     "count" : 1.0
    101 }
    102 
    103 /* 18 */
    104 {
    105     "_id" : "se",
    106     "count" : 1.0
    107 }
    108 
    109 /* 19 */
    110 {
    111     "_id" : "gr",
    112     "count" : 1.0
    113 }
    114 
    115 /* 20 */
    116 {
    117     "_id" : "unknown",
    118     "count" : 1.0
    119 }
    120 
    121 /* 21 */
    122 {
    123     "_id" : "bg",
    124     "count" : 1.0
    125 }
Note: See TracChangeset for help on using the changeset viewer.