AlertsSpecification.md

# TOSCA profile version this document declares.
tosca_definitions_version: tosca_simple_profile_for_nfv_1_0_0

description: TOSCA Alerts Configuration document

# External definitions file pulled into this document.
imports:
- flame_clmc_alerts_definitions.yaml

# NOTE(review): sfc / sfci presumably identify the service function chain and
# the chain instance these alerts belong to - confirm against the consumer.
metadata:
  sfc: companyA-VR
  sfci: companyA-VR-premium

topology_template:

  policies:
    # Policy holding one threshold trigger on the mean of network.latency.
    - high_latency_policy:
        type: eu.ict-flame.policies.StateChange
        triggers:
          high_latency:
            description: This event triggers when the mean network latency in a given location exceeds a given threshold (in ms).
            event_type: threshold
            metric: network.latency  # <measurement>.<field>
            condition:
              threshold: 45  # in ms, per the description above
              granularity: 120  # period in seconds
              aggregation_method: mean
              # tag name/value pairs giving the trigger its context (here: one location)
              resource_type:
                flame_location: watershed
              comparison_operator: gt  # greater than
            action:
              # two alert handlers: flame_sfemc and an HTTP alert handler URL
              implementation:
                - flame_sfemc
                - http://companyA.alert-handler.flame.eu/high-latency

    # Policy holding one threshold trigger on the last reported value of storage.requests.
    - low_requests_policy:
        type: eu.ict-flame.policies.StateChange
        triggers:
          low_requests:
            description: |
              This event triggers when the last reported number of requests for a given service function
              falls behind a given threshold.
            event_type: threshold
            metric: storage.requests  # <measurement>.<field>
            condition:
              threshold: 5
              granularity: 60  # period in seconds
              aggregation_method: last
              resource_type:
                flame_sfp: storage
                flame_sf: storage-users
                # tag names carry the flame_ prefix, as in every other trigger of this document
                flame_location: watershed
              comparison_operator: lt  # less than
            action:
              # two alert handlers: flame_sfemc and an HTTP alert handler URL
              implementation:
                - flame_sfemc
                - http://companyA.alert-handler.flame.eu/low-requests

    # Policy holding two relative triggers on storage.requests: one for an
    # increase and one for a decrease over the same 120 second window.
    - requests_diff_policy:
        type: eu.ict-flame.policies.StateChange
        triggers:
          increase_in_requests:
            description: |
              This event triggers when the number of requests has increased relative to the number of requests received
              120 seconds ago.
            event_type: relative
            metric: storage.requests  # <measurement>.<field>
            condition:
              threshold: 100  # requests have increased by at least 100
              granularity: 120  # compare against the value from 120 seconds ago (per the description)
              resource_type:
                flame_sfp: storage
                flame_sf: storage-users
                flame_server: watershed
                flame_location: watershed
              comparison_operator: gte  # greater than or equal to
            action:
              implementation:
                - flame_sfemc
          decrease_in_requests:
            description: |
              This event triggers when the number of requests has decreased relative to the number of requests received
              120 seconds ago.
            event_type: relative
            metric: storage.requests  # <measurement>.<field>
            condition:
              threshold: -100  # requests have decreased by at least 100
              granularity: 120  # compare against the value from 120 seconds ago (per the description)
              resource_type:
                flame_sfp: storage
                flame_sf: storage-users
                flame_location: watershed
              comparison_operator: lte  # less than or equal to
            action:
              implementation:
                - flame_sfemc

    # Policy holding one deadman trigger that fires when storage measurements stop arriving.
    - missing_measurement_policy:
        type: eu.ict-flame.policies.StateChange
        triggers:
          missing_storage_measurements:
            description: This event triggers when the number of storage measurements reported falls below the threshold value.
            event_type: deadman
            # Deadman triggers monitor the whole measurement (storage in this case), so the field part is
            # simply a star to stay compliant with the <measurement>.<field> format.
            metric: storage.*
            condition:
              threshold: 0  # fires when the count is less than or equal to 0 (in other words, no measurements are reported)
              granularity: 60  # check for missing data over the last 60 seconds
              resource_type:
                flame_sfp: storage
            action:
              # single alert handler: an HTTP alert handler URL
              implementation:
                - http://companyA.alert-handler.flame.eu/missing-measurements
metadata:
    sfc: <sfc_id>
    sfci: <sfc_i_id>
topology_template:

    policies:
        - <policy_identifier>:
            type: eu.ict-flame.policies.StateChange
            triggers:
                <event identifier>:
                  description: <optional description for the given event trigger>
                  event_type: <threshold | relative | deadman>
                  metric: <measurement>.<field>
                  condition:
                    threshold: <critical value - semantics depend on the event type>
                    granularity: <period in seconds - semantics depend on the event type>
                    aggregation_method: <aggregation function supported by InfluxDB - e.g. 'mean'>
                    resource_type:
                      <CLMC Information Model Tag Name>: <CLMC Information Model Tag Value>
                      <CLMC Information Model Tag Name>: <CLMC Information Model Tag Value>
                      ...
                    comparison_operator: <logical operator to use for comparison, e.g. 'gt', 'lt', 'gte', etc.>
                  action:
                    implementation:
                      - <flame_sfemc or HTTP Alert Handler URL - receives POST messages from Kapacitor when alerts trigger>
                      - <flame_sfemc or HTTP Alert Handler URL - receives POST messages from Kapacitor when alerts trigger>
                      ...
        ...
# Example threshold trigger: compares the mean of network.latency against a fixed limit.
high_latency:
    description: This event triggers when the mean network latency in a given location exceeds a given threshold (in ms).
    event_type: threshold
    metric: network.latency  # <measurement>.<field>
    condition:
      threshold: 45  # in ms, per the description above
      granularity: 120  # period in seconds
      aggregation_method: mean
      # tag name/value pairs giving the trigger its context (here: one location)
      resource_type:
        flame_location: watershed
      comparison_operator: gt  # greater than
    action:
      # two alert handlers: flame_sfemc and an HTTP alert handler URL
      implementation:
        - flame_sfemc
        - http://companyA.alert-handler.flame.eu/high-latency
"lt" : "less than",
"gt" : "greater than",
"lte" : "less than or equal to",
"gte" : "greater than or equal to",
"eq" : "equal",
"neq" : "not equal"
# Example relative trigger: compares the current value of storage.requests with an earlier one.
decrease_in_requests:
    description: |
      This event triggers when the number of requests has decreased relative to the number of requests received
      120 seconds ago.
    event_type: relative
    metric: storage.requests  # <measurement>.<field>
    condition:
      threshold: -100  # negative value: a drop of at least 100 requests
      granularity: 120  # compare against the value from 120 seconds ago (per the description)
      resource_type:
        flame_sfp: storage
        flame_sf: storage-users
        flame_location: watershed
      comparison_operator: lte  # less than or equal to
    action:
      implementation:
        - flame_sfemc
# Example deadman trigger: fires when storage measurements stop being reported.
missing_storage_measurements:
    description: This event triggers when the number of storage measurements reported falls below the threshold value.
    event_type: deadman
    # the star stands in for the field part of the <measurement>.<field> format
    metric: storage.*
    condition:
      threshold: 0
      granularity: 60  # period in seconds
      resource_type:
        flame_sfp: storage
    action:
      implementation:
        - flame_sfemc