diff --git a/resources/addresses/es.yaml b/resources/addresses/es.yaml index f55ab75f..10905d3b 100644 --- a/resources/addresses/es.yaml +++ b/resources/addresses/es.yaml @@ -3,6 +3,64 @@ # Note: make Latin-American conventions by default (country overrides for Spain # as well as any other country-specific norms) +components: + po_box: + null_probability: 0.9 + alphanumeric_probability: 0.1 + conditional: + - component: level + probabilities: + null_probability: 0.995 + alphanumeric_probability: 0.005 + - component: unit + probabilities: + null_probability: 0.99 + alphanumeric_probability: 0.01 + - component: staircase + probabilities: + null_probability: 0.999 + alphanumeric_probability: 0.001 + - component: entrance + probabilities: + null_probability: 0.999 + alphanumeric_probability: 0.001 + + level: + # If no floor number is specified + null_probability: 0.6 + alphanumeric_probability: 0.35 + standalone_probability: 0.05 + + staircase: + null_probability: 0.989 + alphanumeric_probability: 0.01 + directional_probability: 0.001 + + entrance: + null_probability: 0.9999 + alphanumeric_probability: 0.0001 + + unit: + # If no unit number is specified + null_probability: 0.3 + alphanumeric_probability: 0.65 + standalone_probability: 0.05 + + combinations: + level_unit: + components: + - level + - unit + label: unit + separators: + - separator: / + probability: 0.2 + - separator: " " + probability: 0.6 + - separator: " - " + probability: 0.2 + probability: 0.005 + numbers: default: &numero canonical: número @@ -198,10 +256,6 @@ levels: canonical_probability: 0.7 abbreviated_probability: 0.1 sample_probability: 0.2 - numeric: - direction: left - numeric_probability: 0.4 - standalone_probability: 0.6 sobreatico: &sobreatico canonical: sobreatico aliases: @@ -251,17 +305,6 @@ levels: numeric_probability: 0.99 alpha_probability: 0.01 - order: - # e.g. Calle Ruiz de Alarcón 23 piso 3 - - after: house_number - probability: 0.8 - # e.g. 
Piso 3, Museo del Prado, Calle Ruiz de Alarcón 23 - - before: house - probability: 0.1 - # e.g. Museo del Prado, Bajos, Calle Ruiz de Alarcón 23 - - before: road - probability: 0.1 - blocks: default: canonical: bloque @@ -373,14 +416,10 @@ po_boxes: alpha_probability: 0.05 # Apdo A numeric_plus_alpha_probability: 0.04 # Apdo 123G alpha_plus_numeric_probability: 0.01 # Apdo A123 - alpha_plus_numeric_whitespace_probability: 0.1 - numeric_plus_alpha_whitespace_probability: 0.1 - - order: - - after: house - probability: 0.8 - - before: house - probability: 0.2 + alpha_plus_numeric: + whitespace_probability: 0.1 + numeric_plus_alpha: + whitespace_probability: 0.1 postcodes: alphanumeric: @@ -535,7 +574,34 @@ entrances: canonical_probability: 0.5 abbreviated_probability: 0.2 sample_probability: 0.3 + numeric: + direction: left + # Entrance 1, Entrance A, etc. + alphanumeric: + default: *entrada + numeric_probability: 0.1 # e.g. Entrance 1 + alpha_probability: 0.85 # e.g. Entrance A + numeric_plus_alpha_probability: 0.025 # e.g. 1A + alpha_plus_numeric_probability: 0.025 # e.g. A1 + + alpha_plus_numeric: + whitespace_probability: 0.1 + + numeric_plus_alpha: + whitespace_probability: 0.1 + + directional: + modifier: + alternatives: + - alternative: *norte + - alternative: *sur + - alternative: *este + - alternative: *oeste + - alternative: *derecha + - alternative: *izquierda + - alternative: *trasera + - alternative: *frente staircases: escalera: &escalera @@ -545,22 +611,38 @@ staircases: canonical_probability: 0.3 abbreviated_probability: 0.4 sample_probability: 0.3 + numeric: + direction: left + + alphanumeric: + # For alphanumerics, Stair A, Stair 1, etc. + default: *escalera + numeric_probability: 0.6 # e.g. Escalera 1 + alpha_probability: 0.35 # e.g. Escalera A + numeric_plus_alpha_probability: 0.025 # e.g. 1A + alpha_plus_numeric_probability: 0.025 # e.g. 
A1 + + alpha_plus_numeric: + whitespace_probability: 0.1 + + numeric_plus_alpha: + whitespace_probability: 0.1 + + directional: + direction: right # e.g. Escalera Izq + direction_probability: 0.8 + modifier: + alternatives: + - alternative: *norte + - alternative: *sur + - alternative: *este + - alternative: *oeste + - alternative: *derecha + - alternative: *izquierda + - alternative: *trasera + - alternative: *frente units: - # Units are not part of the global address formats (and are not always standard) - # This is a list of places in the address where the unit line might go - order: - - before: house - probability: 0.05 - - before: road - probability: 0.05 - # e.g. Piso 3 Dpto 12 (most common) - - after: level - probability: 0.8 - # e.g. Apto 6, 2o piso (less common) - - before: level - probability: 0.1 - apartment: &apartamento canonical: apartamento abbreviated: apto @@ -669,9 +751,7 @@ units: - alternative: *casa probability: 0.05 - alternative: *puerta - probability: 0.045 - - alternative: *atico - probability: 0.005 + probability: 0.05 # Separate random probability for adding directions like 2o Izq, 2 Dcha, etc. add_direction: true @@ -683,8 +763,10 @@ units: numeric_plus_alpha_probability: 0.01 # e.g. Dpto 1A alpha_plus_numeric_probability: 0.01 # e.g. Dpto A1 alpha_probability: 0.08 # e.g. 
Dpto A - alpha_plus_numeric_whitespace_probability: 0.1 - numeric_plus_alpha_whitespace_probability: 0.1 + alpha_plus_numeric: + whitespace_probability: 0.1 + numeric_plus_alpha: + whitespace_probability: 0.1 alphanumeric_apartamento: &unit_alphanumeric_apartamento @@ -697,9 +779,7 @@ units: - alternative: *casa probability: 0.05 - alternative: *puerta - probability: 0.045 - - alternative: *atico - probability: 0.005 + probability: 0.05 alphanumeric_apartamento_exclusive: &unit_alphanumeric_apartamento_exclusive <<: *unit_alphanumeric @@ -709,9 +789,7 @@ units: - alternative: *casa probability: 0.05 - alternative: *puerta - probability: 0.045 - - alternative: *atico - probability: 0.005 + probability: 0.05 zones: residential: *unit_alphanumeric @@ -755,28 +833,14 @@ units: parcel_plus_lot_probability: 0.02 - - # For unit types like 2o/B - combined: - component: level - direction: right - separators: - - separator: / - probability: 0.2 - - separator: " " - probability: 0.6 - - separator: " - " - probability: 0.2 - - # If no unit number is specified - alphanumeric_probability: 0.75 - standalone_probability: 0.2495 - combined_probability: 0.005 - - countries: # España / Spain es: + components: + staircase: + null_probability: 0.97 + alphanumeric_probability: 0.02 + directional_probability: 0.01 levels: planta: &planta # Everywhere except Spain @@ -897,9 +961,7 @@ countries: - alternative: *apartamento probability: 0.1 - alternative: *casa - probability: 0.05 - - alternative: *atico - probability: 0.05 + probability: 0.1 zones: residential: *unit_alphanumeric_puerta