[addresses] Spanish sub-building component probabilities
This commit is contained in:
@@ -3,6 +3,64 @@
|
|||||||
# Note: use Latin-American conventions by default (country overrides for Spain
|
# Note: use Latin-American conventions by default (country overrides for Spain
|
||||||
# as well as any other country-specific norms)
|
# as well as any other country-specific norms)
|
||||||
|
|
||||||
|
components:
|
||||||
|
po_box:
|
||||||
|
null_probability: 0.9
|
||||||
|
alphanumeric_probability: 0.1
|
||||||
|
conditional:
|
||||||
|
- component: level
|
||||||
|
probabilities:
|
||||||
|
null_probability: 0.995
|
||||||
|
alphanumeric_probability: 0.005
|
||||||
|
- component: unit
|
||||||
|
probabilities:
|
||||||
|
null_probability: 0.99
|
||||||
|
alphanumeric_probability: 0.01
|
||||||
|
- component: staircase
|
||||||
|
probabilities:
|
||||||
|
null_probability: 0.999
|
||||||
|
alphanumeric_probability: 0.001
|
||||||
|
- component: entrance
|
||||||
|
probabilities:
|
||||||
|
null_probability: 0.999
|
||||||
|
alphanumeric_probability: 0.001
|
||||||
|
|
||||||
|
level:
|
||||||
|
# If no floor number is specified
|
||||||
|
null_probability: 0.6
|
||||||
|
alphanumeric_probability: 0.35
|
||||||
|
standalone_probability: 0.05
|
||||||
|
|
||||||
|
staircase:
|
||||||
|
null_probability: 0.989
|
||||||
|
alphanumeric_probability: 0.01
|
||||||
|
directional_probability: 0.001
|
||||||
|
|
||||||
|
entrance:
|
||||||
|
null_probability: 0.9999
|
||||||
|
alphanumeric_probability: 0.0001
|
||||||
|
|
||||||
|
unit:
|
||||||
|
# If no unit number is specified
|
||||||
|
null_probability: 0.3
|
||||||
|
alphanumeric_probability: 0.65
|
||||||
|
standalone_probability: 0.05
|
||||||
|
|
||||||
|
combinations:
|
||||||
|
level_unit:
|
||||||
|
components:
|
||||||
|
- level
|
||||||
|
- unit
|
||||||
|
label: unit
|
||||||
|
separators:
|
||||||
|
- separator: /
|
||||||
|
probability: 0.2
|
||||||
|
- separator: " "
|
||||||
|
probability: 0.6
|
||||||
|
- separator: " - "
|
||||||
|
probability: 0.2
|
||||||
|
probability: 0.005
|
||||||
|
|
||||||
numbers:
|
numbers:
|
||||||
default: &numero
|
default: &numero
|
||||||
canonical: número
|
canonical: número
|
||||||
@@ -198,10 +256,6 @@ levels:
|
|||||||
canonical_probability: 0.7
|
canonical_probability: 0.7
|
||||||
abbreviated_probability: 0.1
|
abbreviated_probability: 0.1
|
||||||
sample_probability: 0.2
|
sample_probability: 0.2
|
||||||
numeric:
|
|
||||||
direction: left
|
|
||||||
numeric_probability: 0.4
|
|
||||||
standalone_probability: 0.6
|
|
||||||
sobreatico: &sobreatico
|
sobreatico: &sobreatico
|
||||||
canonical: sobreatico
|
canonical: sobreatico
|
||||||
aliases:
|
aliases:
|
||||||
@@ -251,17 +305,6 @@ levels:
|
|||||||
numeric_probability: 0.99
|
numeric_probability: 0.99
|
||||||
alpha_probability: 0.01
|
alpha_probability: 0.01
|
||||||
|
|
||||||
order:
|
|
||||||
# e.g. Calle Ruiz de Alarcón 23 piso 3
|
|
||||||
- after: house_number
|
|
||||||
probability: 0.8
|
|
||||||
# e.g. Piso 3, Museo del Prado, Calle Ruiz de Alarcón 23
|
|
||||||
- before: house
|
|
||||||
probability: 0.1
|
|
||||||
# e.g. Museo del Prado, Bajos, Calle Ruiz de Alarcón 23
|
|
||||||
- before: road
|
|
||||||
probability: 0.1
|
|
||||||
|
|
||||||
blocks:
|
blocks:
|
||||||
default:
|
default:
|
||||||
canonical: bloque
|
canonical: bloque
|
||||||
@@ -373,14 +416,10 @@ po_boxes:
|
|||||||
alpha_probability: 0.05 # Apdo A
|
alpha_probability: 0.05 # Apdo A
|
||||||
numeric_plus_alpha_probability: 0.04 # Apdo 123G
|
numeric_plus_alpha_probability: 0.04 # Apdo 123G
|
||||||
alpha_plus_numeric_probability: 0.01 # Apdo A123
|
alpha_plus_numeric_probability: 0.01 # Apdo A123
|
||||||
alpha_plus_numeric_whitespace_probability: 0.1
|
alpha_plus_numeric:
|
||||||
numeric_plus_alpha_whitespace_probability: 0.1
|
whitespace_probability: 0.1
|
||||||
|
numeric_plus_alpha:
|
||||||
order:
|
whitespace_probability: 0.1
|
||||||
- after: house
|
|
||||||
probability: 0.8
|
|
||||||
- before: house
|
|
||||||
probability: 0.2
|
|
||||||
|
|
||||||
postcodes:
|
postcodes:
|
||||||
alphanumeric:
|
alphanumeric:
|
||||||
@@ -535,7 +574,34 @@ entrances:
|
|||||||
canonical_probability: 0.5
|
canonical_probability: 0.5
|
||||||
abbreviated_probability: 0.2
|
abbreviated_probability: 0.2
|
||||||
sample_probability: 0.3
|
sample_probability: 0.3
|
||||||
|
numeric:
|
||||||
|
direction: left
|
||||||
|
|
||||||
|
# Entrance 1, Entrance A, etc.
|
||||||
|
alphanumeric:
|
||||||
|
default: *entrada
|
||||||
|
numeric_probability: 0.1 # e.g. Entrance 1
|
||||||
|
alpha_probability: 0.85 # e.g. Entrance A
|
||||||
|
numeric_plus_alpha_probability: 0.025 # e.g. 1A
|
||||||
|
alpha_plus_numeric_probability: 0.025 # e.g. A1
|
||||||
|
|
||||||
|
alpha_plus_numeric:
|
||||||
|
whitespace_probability: 0.1
|
||||||
|
|
||||||
|
numeric_plus_alpha:
|
||||||
|
whitespace_probability: 0.1
|
||||||
|
|
||||||
|
directional:
|
||||||
|
modifier:
|
||||||
|
alternatives:
|
||||||
|
- alternative: *norte
|
||||||
|
- alternative: *sur
|
||||||
|
- alternative: *este
|
||||||
|
- alternative: *oeste
|
||||||
|
- alternative: *derecha
|
||||||
|
- alternative: *izquierda
|
||||||
|
- alternative: *trasera
|
||||||
|
- alternative: *frente
|
||||||
|
|
||||||
staircases:
|
staircases:
|
||||||
escalera: &escalera
|
escalera: &escalera
|
||||||
@@ -545,22 +611,38 @@ staircases:
|
|||||||
canonical_probability: 0.3
|
canonical_probability: 0.3
|
||||||
abbreviated_probability: 0.4
|
abbreviated_probability: 0.4
|
||||||
sample_probability: 0.3
|
sample_probability: 0.3
|
||||||
|
numeric:
|
||||||
|
direction: left
|
||||||
|
|
||||||
|
alphanumeric:
|
||||||
|
# For alphanumerics, Stair A, Stair 1, etc.
|
||||||
|
default: *escalera
|
||||||
|
numeric_probability: 0.6 # e.g. Escalera 1
|
||||||
|
alpha_probability: 0.35 # e.g. Escalera A
|
||||||
|
numeric_plus_alpha_probability: 0.025 # e.g. 1A
|
||||||
|
alpha_plus_numeric_probability: 0.025 # e.g. A1
|
||||||
|
|
||||||
|
alpha_plus_numeric:
|
||||||
|
whitespace_probability: 0.1
|
||||||
|
|
||||||
|
numeric_plus_alpha:
|
||||||
|
whitespace_probability: 0.1
|
||||||
|
|
||||||
|
directional:
|
||||||
|
direction: right # e.g. Escalera Izq
|
||||||
|
direction_probability: 0.8
|
||||||
|
modifier:
|
||||||
|
alternatives:
|
||||||
|
- alternative: *norte
|
||||||
|
- alternative: *sur
|
||||||
|
- alternative: *este
|
||||||
|
- alternative: *oeste
|
||||||
|
- alternative: *derecha
|
||||||
|
- alternative: *izquierda
|
||||||
|
- alternative: *trasera
|
||||||
|
- alternative: *frente
|
||||||
|
|
||||||
units:
|
units:
|
||||||
# Units are not part of the global address formats (and are not always standard)
|
|
||||||
# This is a list of places in the address where the unit line might go
|
|
||||||
order:
|
|
||||||
- before: house
|
|
||||||
probability: 0.05
|
|
||||||
- before: road
|
|
||||||
probability: 0.05
|
|
||||||
# e.g. Piso 3 Dpto 12 (most common)
|
|
||||||
- after: level
|
|
||||||
probability: 0.8
|
|
||||||
# e.g. Apto 6, 2o piso (less common)
|
|
||||||
- before: level
|
|
||||||
probability: 0.1
|
|
||||||
|
|
||||||
apartment: &apartamento
|
apartment: &apartamento
|
||||||
canonical: apartamento
|
canonical: apartamento
|
||||||
abbreviated: apto
|
abbreviated: apto
|
||||||
@@ -669,9 +751,7 @@ units:
|
|||||||
- alternative: *casa
|
- alternative: *casa
|
||||||
probability: 0.05
|
probability: 0.05
|
||||||
- alternative: *puerta
|
- alternative: *puerta
|
||||||
probability: 0.045
|
probability: 0.05
|
||||||
- alternative: *atico
|
|
||||||
probability: 0.005
|
|
||||||
|
|
||||||
# Separate random probability for adding directions like 2o Izq, 2 Dcha, etc.
|
# Separate random probability for adding directions like 2o Izq, 2 Dcha, etc.
|
||||||
add_direction: true
|
add_direction: true
|
||||||
@@ -683,8 +763,10 @@ units:
|
|||||||
numeric_plus_alpha_probability: 0.01 # e.g. Dpto 1A
|
numeric_plus_alpha_probability: 0.01 # e.g. Dpto 1A
|
||||||
alpha_plus_numeric_probability: 0.01 # e.g. Dpto A1
|
alpha_plus_numeric_probability: 0.01 # e.g. Dpto A1
|
||||||
alpha_probability: 0.08 # e.g. Dpto A
|
alpha_probability: 0.08 # e.g. Dpto A
|
||||||
alpha_plus_numeric_whitespace_probability: 0.1
|
alpha_plus_numeric:
|
||||||
numeric_plus_alpha_whitespace_probability: 0.1
|
whitespace_probability: 0.1
|
||||||
|
numeric_plus_alpha:
|
||||||
|
whitespace_probability: 0.1
|
||||||
|
|
||||||
|
|
||||||
alphanumeric_apartamento: &unit_alphanumeric_apartamento
|
alphanumeric_apartamento: &unit_alphanumeric_apartamento
|
||||||
@@ -697,9 +779,7 @@ units:
|
|||||||
- alternative: *casa
|
- alternative: *casa
|
||||||
probability: 0.05
|
probability: 0.05
|
||||||
- alternative: *puerta
|
- alternative: *puerta
|
||||||
probability: 0.045
|
probability: 0.05
|
||||||
- alternative: *atico
|
|
||||||
probability: 0.005
|
|
||||||
|
|
||||||
alphanumeric_apartamento_exclusive: &unit_alphanumeric_apartamento_exclusive
|
alphanumeric_apartamento_exclusive: &unit_alphanumeric_apartamento_exclusive
|
||||||
<<: *unit_alphanumeric
|
<<: *unit_alphanumeric
|
||||||
@@ -709,9 +789,7 @@ units:
|
|||||||
- alternative: *casa
|
- alternative: *casa
|
||||||
probability: 0.05
|
probability: 0.05
|
||||||
- alternative: *puerta
|
- alternative: *puerta
|
||||||
probability: 0.045
|
probability: 0.05
|
||||||
- alternative: *atico
|
|
||||||
probability: 0.005
|
|
||||||
|
|
||||||
zones:
|
zones:
|
||||||
residential: *unit_alphanumeric
|
residential: *unit_alphanumeric
|
||||||
@@ -755,28 +833,14 @@ units:
|
|||||||
parcel_plus_lot_probability: 0.02
|
parcel_plus_lot_probability: 0.02
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
# For unit types like 2o/B
|
|
||||||
combined:
|
|
||||||
component: level
|
|
||||||
direction: right
|
|
||||||
separators:
|
|
||||||
- separator: /
|
|
||||||
probability: 0.2
|
|
||||||
- separator: " "
|
|
||||||
probability: 0.6
|
|
||||||
- separator: " - "
|
|
||||||
probability: 0.2
|
|
||||||
|
|
||||||
# If no unit number is specified
|
|
||||||
alphanumeric_probability: 0.75
|
|
||||||
standalone_probability: 0.2495
|
|
||||||
combined_probability: 0.005
|
|
||||||
|
|
||||||
|
|
||||||
countries:
|
countries:
|
||||||
# España / Spain
|
# España / Spain
|
||||||
es:
|
es:
|
||||||
|
components:
|
||||||
|
staircase:
|
||||||
|
null_probability: 0.97
|
||||||
|
alphanumeric_probability: 0.02
|
||||||
|
directional_probability: 0.01
|
||||||
levels:
|
levels:
|
||||||
planta: &planta
|
planta: &planta
|
||||||
# Everywhere except Spain
|
# Everywhere except Spain
|
||||||
@@ -897,9 +961,7 @@ countries:
|
|||||||
- alternative: *apartamento
|
- alternative: *apartamento
|
||||||
probability: 0.1
|
probability: 0.1
|
||||||
- alternative: *casa
|
- alternative: *casa
|
||||||
probability: 0.05
|
probability: 0.1
|
||||||
- alternative: *atico
|
|
||||||
probability: 0.05
|
|
||||||
|
|
||||||
zones:
|
zones:
|
||||||
residential: *unit_alphanumeric_puerta
|
residential: *unit_alphanumeric_puerta
|
||||||
|
|||||||
Reference in New Issue
Block a user