pelias / api

HTTP API for Pelias Geocoder
http://pelias.io
MIT License
218 stars 162 forks source link

address deduplication testcase #1385

Open missinglink opened 4 years ago

missinglink commented 4 years ago

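The following three address records (one from OpenAddresses, two from OpenStreetMap) describe the same place and are almost identical, but they are not being deduplicated. Apart from their source IDs, they differ only in the street suffix ("Dean St" vs. "Dean Street", which also carries into the name and label), the postal code (11217 vs. 11201), and a tiny coordinate offset: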

https://pelias.github.io/compare/#/v1/search%3Ftext=190%20dean%20street%20brooklyn

Screenshot 2019-11-14 at 11 07 16
"features": [
    {
      "type": "Feature",
      "geometry": {
        "type": "Point",
        "coordinates": [
          -73.98587,
          40.685617
        ]
      },
      "properties": {
        "id": "us/ny/city_of_new_york:0dea5df48834ec24",
        "gid": "openaddresses:address:us/ny/city_of_new_york:0dea5df48834ec24",
        "layer": "address",
        "source": "openaddresses",
        "source_id": "us/ny/city_of_new_york:0dea5df48834ec24",
        "name": "190 Dean St",
        "housenumber": "190",
        "street": "Dean St",
        "postalcode": "11217",
        "confidence": 1,
        "match_type": "exact",
        "accuracy": "point",
        "country": "United States",
        "country_gid": "whosonfirst:country:85633793",
        "country_a": "USA",
        "region": "New York",
        "region_gid": "whosonfirst:region:85688543",
        "region_a": "NY",
        "county": "Kings County",
        "county_gid": "whosonfirst:county:102082361",
        "county_a": "KI",
        "locality": "New York",
        "locality_gid": "whosonfirst:locality:85977539",
        "locality_a": "NYC",
        "borough": "Brooklyn",
        "borough_gid": "whosonfirst:borough:421205765",
        "neighbourhood": "Boerum Hill",
        "neighbourhood_gid": "whosonfirst:neighbourhood:85869125",
        "continent": "North America",
        "continent_gid": "whosonfirst:continent:102191575",
        "label": "190 Dean St, Brooklyn, New York, NY, USA"
      }
    },
    {
      "type": "Feature",
      "geometry": {
        "type": "Point",
        "coordinates": [
          -73.985859,
          40.685613
        ]
      },
      "properties": {
        "id": "node/2664302423",
        "gid": "openstreetmap:address:node/2664302423",
        "layer": "address",
        "source": "openstreetmap",
        "source_id": "node/2664302423",
        "name": "190 Dean Street",
        "housenumber": "190",
        "street": "Dean Street",
        "postalcode": "11201",
        "confidence": 1,
        "match_type": "exact",
        "accuracy": "point",
        "country": "United States",
        "country_gid": "whosonfirst:country:85633793",
        "country_a": "USA",
        "region": "New York",
        "region_gid": "whosonfirst:region:85688543",
        "region_a": "NY",
        "county": "Kings County",
        "county_gid": "whosonfirst:county:102082361",
        "county_a": "KI",
        "locality": "New York",
        "locality_gid": "whosonfirst:locality:85977539",
        "locality_a": "NYC",
        "borough": "Brooklyn",
        "borough_gid": "whosonfirst:borough:421205765",
        "neighbourhood": "Boerum Hill",
        "neighbourhood_gid": "whosonfirst:neighbourhood:85869125",
        "continent": "North America",
        "continent_gid": "whosonfirst:continent:102191575",
        "label": "190 Dean Street, Brooklyn, New York, NY, USA"
      }
    },
    {
      "type": "Feature",
      "geometry": {
        "type": "Point",
        "coordinates": [
          -73.98587,
          40.685617
        ]
      },
      "properties": {
        "id": "node/2550066407",
        "gid": "openstreetmap:address:node/2550066407",
        "layer": "address",
        "source": "openstreetmap",
        "source_id": "node/2550066407",
        "name": "190 Dean Street",
        "housenumber": "190",
        "street": "Dean Street",
        "postalcode": "11217",
        "confidence": 1,
        "match_type": "exact",
        "accuracy": "point",
        "country": "United States",
        "country_gid": "whosonfirst:country:85633793",
        "country_a": "USA",
        "region": "New York",
        "region_gid": "whosonfirst:region:85688543",
        "region_a": "NY",
        "county": "Kings County",
        "county_gid": "whosonfirst:county:102082361",
        "county_a": "KI",
        "locality": "New York",
        "locality_gid": "whosonfirst:locality:85977539",
        "locality_a": "NYC",
        "borough": "Brooklyn",
        "borough_gid": "whosonfirst:borough:421205765",
        "neighbourhood": "Boerum Hill",
        "neighbourhood_gid": "whosonfirst:neighbourhood:85869125",
        "continent": "North America",
        "continent_gid": "whosonfirst:continent:102191575",
        "label": "190 Dean Street, Brooklyn, New York, NY, USA"
      }
    }
  ]
missinglink commented 4 years ago

Here's a similar issue caused by lack of synonym support for street suffixes:

Screenshot 2019-11-14 at 11 15 44
missinglink commented 4 years ago

Screenshot 2019-11-15 at 12 58 55

missinglink commented 4 years ago

Potential duplicate of https://github.com/pelias/pelias/issues/438