zoukankan      html  css  js  c++  java
  • prometheus+alertmanage+grafana安装部署

    部署prometheus-operator
    #克隆kube-prometheus项目
    git clone https://github.com/coreos/kube-prometheus.git
    
    
    cd kube-prometheus/manifests
    mkdir prometheus-operator
    mv 0*  prometheus-operator
    cd prometheus-operator
    kubectl apply -f . 
    
    
    #查看是否部署成功
    kubectl -n monitoring get pod -o wide
    kubectl -n monitoring get svc
    kubectl -n monitoring get sevicemonitor
    
    
    
    Alertmanager 部署
    cd kube-prometheus/manifests
    mkdir alertmanager
    mv alertmanager*  alertmanager
    cd alertmanager
    #添加外部访问,使用svc nodeport
    vim alertmanager-service.yaml
    apiVersion: v1
    kind: Service
    metadata:
      labels:
        alertmanager: main
      name: alertmanager-main
      namespace: monitoring
    spec:
      ports:
      - name: web
        port: 9093
        targetPort: web
        nodePort: 30903 
      type: NodePort
      selector:
        alertmanager: main
        app: alertmanager
      sessionAffinity: ClientIP
    #安装部署  
    kubectl apply -f . 
    
    #查看部署是否成功
    kubectl -n monitoring get pod -o wide
    kubectl -n monitoring get svc
    
    
    
    #修改alertmanage配置,先删除默认配置
    #prometheus alertmanager 支持配置自动发现和更新
    kubectl delete secret alertmanager-main -n monitoring
    #开启邮件报警
    vim alertmanager.yaml
    global:
      resolve_timeout: 5m
      smtp_smarthost: 'smtp.163.com:25'
      smtp_from: 'prometheus_alert01@163.com'
      smtp_auth_username: 'prometheus_alert01@163.com'
      smtp_auth_password: '邮箱密码'
    
    route:
      group_by: ['job', 'altername', 'cluster', 'service','severity']
      group_wait: 30s
      group_interval: 5m
      repeat_interval: 20m
      receiver: 'team-ops-mails'
    
      routes:
      - match_re:
          service: ^(foo1|foo2|baz)$
        receiver: 'team-ops-mails'
        routes:
        - match:
            severity: critical
          receiver: 'team-ops-mails'
      - match:
          service: database
        receiver: 'team-ops-mails'
      - match:
          severity: critical
        receiver: 'team-ops-mails'
    inhibit_rules:
    - source_match:
        severity: 'critical'
      target_match:
        severity: 'warning'
    receivers:
    - name: 'team-ops-mails'
      email_configs:
      - to: 'xieyi5420@163.com'
    
    
    #重新生成secret配置
    kubectl create secret generic alertmanager-main --from-file=alertmanager.yaml -n monitoring
    
    
    #打开浏览器验证配置
    http://nodeip:30903
    
    
    
    
    
    prometheus 部署
    cd kube-prometheus/manifests
    mkdir prometheus 
    mv prometheus-cluster* prometheus
    mv prometheus-prometheus.yaml prometheus
    mv prometheus-role* prometheus
    mv prometheus-rules.yaml prometheus
    mv prometheus-service* prometheus
    
    # 以后所有系统业务的监控yaml 放到此文件夹
    mkdir prometheus-monitor
    mv prometheus-service*  prometheus-monitor
    
    
    #创建etcd secret
    kubectl -n monitoring create secret generic etcd-certs --from-file=ca.pem --from-file=etcd-key.pem  --from-file=etcd.pem
    
    cd prometheus
    #修改
    vim prometheus-prometheus.yaml
    apiVersion: monitoring.coreos.com/v1
    kind: Prometheus
    metadata:
      labels:
        prometheus: k8s
      name: k8s
      namespace: monitoring
    spec:
      alerting:
        alertmanagers:
        - name: alertmanager-main
          namespace: monitoring
          port: web
      baseImage: quay.io/prometheus/prometheus
      nodeSelector:
        beta.kubernetes.io/os: linux
      replicas: 2
      secrets:
        # 添加etcd 证书
      - etcd-certs
      resources:
        requests:
              # 设置内存大小
          memory: 2048Mi
        # 设置数据保留天数
      retention: 7d
        # 创建外部存储pvc
      storage:
        volumeClaimTemplate:
          spec:
            accessModes:
            - ReadWriteOnce
            metadata:
              annotations:
                 volume.beta.kubernetes.io/storage-class: "managed-nfs-storage"
                 #storageclass.kubernetes.io/is-default-class: true # 使用那种动态存储 设置默认动态存储
              labels:
                prometheus: ingest-webrtc
            resources:
              requests:
                storage: 100Gi # 存储空间大小
      ruleSelector:
        matchLabels:
          prometheus: k8s
          role: alert-rules
      securityContext:
        fsGroup: 2000
        runAsNonRoot: true
        runAsUser: 1000
      serviceAccountName: prometheus-k8s
      serviceMonitorNamespaceSelector: {}
      serviceMonitorSelector: {}
      version: v2.11.0 # 版本号
    
    #暴露端口提供外部访问nodeport
    vim prometheus-service.yaml
    apiVersion: v1
    kind: Service
    metadata:
      labels:
        prometheus: k8s
      name: prometheus-k8s
      namespace: monitoring
    spec:
      ports:
      - name: web
        port: 9090
        targetPort: web
        nodePort: 30900
      type: NodePort
      selector:
        app: prometheus
        prometheus: k8s
      sessionAffinity: ClientIP
    
    #验证
    [root@k8s-master01 prometheus]# kubectl -n monitoring get pods | grep prometheus-k8s
    prometheus-k8s-0                       3/3     Running   1          9m43s
    prometheus-k8s-1                       3/3     Running   1          9m43s
    
    #验证pv pvc
    [root@k8s-master01 prometheus]# kubectl -n monitoring get pv
    NAME                                       CAPACITY   ACCESS MODES   RECLAIM POLICY   STATUS   CLAIM                                           STORAGECLASS          REASON   AGE
    pvc-44fb9246-5bc2-489e-bd46-22eae420c9bc   100Gi      RWO            Delete           Bound    monitoring/prometheus-k8s-db-prometheus-k8s-0   managed-nfs-storage            10m
    pvc-c46161f3-32d1-4294-9b64-f16aba5b3595   100Gi      RWO            Delete           Bound    monitoring/prometheus-k8s-db-prometheus-k8s-1   managed-nfs-storage            10m
    [root@k8s-master01 prometheus]# kubectl -n monitoring get pvc
    NAME                                 STATUS   VOLUME                                     CAPACITY   ACCESS MODES   STORAGECLASS          AGE
    prometheus-k8s-db-prometheus-k8s-0   Bound    pvc-44fb9246-5bc2-489e-bd46-22eae420c9bc   100Gi      RWO            managed-nfs-storage   11m
    prometheus-k8s-db-prometheus-k8s-1   Bound    pvc-c46161f3-32d1-4294-9b64-f16aba5b3595   100Gi      RWO            managed-nfs-storage   11m
    
    
    #创建监控服务
    cd ../prometheus-monitor/
    vim prometheus-serviceMonitorKubelet.yaml 
    apiVersion: monitoring.coreos.com/v1
    kind: ServiceMonitor
    metadata:
      labels:
        k8s-app: kubelet
      name: kubelet
      namespace: monitoring
    spec:
      endpoints:
      - bearerTokenFile: /var/run/secrets/kubernetes.io/serviceaccount/token
        honorLabels: true
        interval: 30s
        port: https-metrics
        scheme: https
        tlsConfig:
          insecureSkipVerify: true
      - bearerTokenFile: /var/run/secrets/kubernetes.io/serviceaccount/token
        honorLabels: true
        interval: 30s
        path: /metrics/cadvisor
        port: https-metrics
        scheme: https
        tlsConfig:
          insecureSkipVerify: true
      jobLabel: k8s-app
      namespaceSelector:
        matchNames:
        - kube-system
      selector:
        matchLabels:
          k8s-app: kubelet
    
    
    #创建etcd监控
    vim prometheus-serviceMonitorEtcd.yaml
    apiVersion: v1
    kind: Service
    metadata:
      labels:
        k8s-app: etcd
      name: etcd
      namespace: monitoring
    spec:
      clusterIP: None
      ports:
      - name: https-metrics
        port: 2379
        protocol: TCP
        targetPort: 2379
      sessionAffinity: None
      type: ClusterIP
    ---
    apiVersion: v1
    kind: Endpoints
    metadata:
      labels:
        k8s-app: etcd
      name: etcd
      namespace: monitoring
    subsets:
    - addresses:
      - ip: 172.23.219.121
        nodeName: k8s-master01
      - ip: 172.23.219.122
        nodeName: k8s-master02
      - ip: 172.23.219.123
        nodeName: k8s-master03
      ports:
      - name: https-metrics
        port: 2379
        protocol: TCP
    ---
    apiVersion: monitoring.coreos.com/v1
    kind: ServiceMonitor
    metadata:
      labels:
        app: etcd
      name: etcd
      namespace: monitoring
    spec:
      endpoints:
      - interval: 10s
        port: https-metrics
        scheme: https
        tlsConfig:
          caFile: /etc/prometheus/secrets/etcd-certs/ca.pem
          certFile: /etc/prometheus/secrets/etcd-certs/etcd.pem
          keyFile: /etc/prometheus/secrets/etcd-certs/etcd-key.pem
          insecureSkipVerify: true
      namespaceSelector:
        matchNames:
        - monitoring
      selector:
        matchLabels:
          k8s-app: etcd
    
    #kube-scheduler 监控 不在k8s集群内部所以要创建Endpoints
    vim  prometheus-serviceMonitorKubeScheduler.yaml
    apiVersion: v1
    kind: Service
    metadata:
      labels:
        k8s-app: kube-scheduler
      name: kube-scheduler
      namespace: monitoring
    spec:
      clusterIP: None
      ports:
      - name: http-metrics
        port: 10251
        protocol: TCP
        targetPort: 10251
      sessionAffinity: None
      type: ClusterIP
    ---
    apiVersion: v1
    kind: Endpoints
    metadata:
      labels:
        k8s-app: kube-scheduler
      name: kube-scheduler
      namespace: monitoring
    subsets:
    - addresses:
      - ip: 172.23.219.121
        nodeName: k8s-master01
      - ip: 172.23.219.122
        nodeName: k8s-master02
      - ip: 172.23.219.123
        nodeName: k8s-master03
      ports:
      - name: http-metrics
        port: 10251
        protocol: TCP
    ---
    apiVersion: monitoring.coreos.com/v1
    kind: ServiceMonitor
    metadata:
      labels:
        app: kube-scheduler
      name: kube-scheduler
      namespace: monitoring
    spec:
      endpoints:
      - interval: 10s
        port: http-metrics
      namespaceSelector:
        matchNames:
        - monitoring
      selector:
        matchLabels:
          k8s-app: kube-scheduler
    
    vim prometheus-serviceMonitorKubeControllerManager.yaml
    apiVersion: v1
    kind: Service
    metadata:
      labels:
        k8s-app: kube-controller-manager
      name: kube-controller-manager
      namespace: monitoring
    spec:
      clusterIP: None
      ports:
      - name: http-controller
        port: 10252
        protocol: TCP
        targetPort: 10252
      sessionAffinity: None
      type: ClusterIP
    ---
    apiVersion: v1
    kind: Endpoints
    metadata:
      labels:
        k8s-app: kube-controller-manager
      name: kube-controller-manager
      namespace: monitoring
    subsets:
    - addresses:
      - ip: 172.23.219.121
        nodeName: k8s-master01
      - ip: 172.23.219.122
        nodeName: k8s-master02
      - ip: 172.23.219.123
        nodeName: k8s-master03
      ports:
      - name: http-controller
        port: 10252
        protocol: TCP
    ---
    apiVersion: monitoring.coreos.com/v1
    kind: ServiceMonitor
    metadata:
      labels:
        app: kube-controller-manager
      name: kube-controller-manager
      namespace: monitoring
    spec:
      endpoints:
      - interval: 10s
        port: http-controller
      namespaceSelector:
        matchNames:
        - monitoring
      selector:
        matchLabels:
          k8s-app: kube-controller-manager
    
    
    vim  prometheus-serviceMonitorApiserver.yaml
    apiVersion: monitoring.coreos.com/v1
    kind: ServiceMonitor
    metadata:
      labels:
        k8s-app: apiserver
      name: kube-apiserver
      namespace: monitoring
    spec:
      endpoints:
      - bearerTokenFile: /var/run/secrets/kubernetes.io/serviceaccount/token
        interval: 30s
        port: https
        scheme: https
        tlsConfig:
          caFile: /var/run/secrets/kubernetes.io/serviceaccount/ca.crt
          serverName: kubernetes
      jobLabel: component
      namespaceSelector:
        matchNames:
        - default
      selector:
        matchLabels:
          component: apiserver
          provider: kubernetes
    
    
    #创建
    kubectl apply -f . 
    
    验证
    
    创建 grafana 服务
    mkdir grafana
    mv gragana-* grafana
    vim grafana-pvc.yaml
    kind: PersistentVolumeClaim
    apiVersion: v1
    metadata:
      name: grafana-pvc
      namespace: monitoring
    spec:
      accessModes:
        - ReadWriteMany
      storageClassName: managed-nfs-storage
      resources:
        requests:
          storage: 50Gi
    
    
    vim grafana-configmap.yaml
    apiVersion: v1
    data:
      grafana.ini: |
        ##################### Grafana Configuration Example #####################
        #
        # Everything has defaults so you only need to uncomment things you want to
        # change
    
        # possible values : production, development
        ; app_mode = production
    
        # instance name, defaults to HOSTNAME environment variable value or hostname if HOSTNAME var is empty
        ; instance_name = ${HOSTNAME}
    
        #################################### Paths ####################################
        [paths]
        # Path to where grafana can store temp files, sessions, and the sqlite3 db (if that is used)
        ;data = /var/lib/grafana
    
        # Directory where grafana can store logs
        ;logs = /var/log/grafana
    
        # Directory where grafana will automatically scan and look for plugins
        ;plugins = /var/lib/grafana/plugins
    
        # folder that contains provisioning config files that grafana will apply on startup and while running.
        ; provisioning = conf/provisioning
    
        #################################### Server ####################################
        [server]
        # Protocol (http, https, socket)
        ;protocol = http
    
        # The ip address to bind to, empty will bind to all interfaces
        ;http_addr =
    
        # The http port  to use
        ;http_port = 3000
    
        # The public facing domain name used to access grafana from a browser
        ;domain = localhost
    
        # Redirect to correct domain if host header does not match domain
        # Prevents DNS rebinding attacks
        ;enforce_domain = false
    
        # The full public facing url you use in browser, used for redirects and emails
        # If you use reverse proxy and sub path specify full url (with sub path)
        ;root_url = http://localhost:3000
    
        # Log web requests
        ;router_logging = false
    
        # the path relative working path
        ;static_root_path = public
    
        # enable gzip
        ;enable_gzip = false
    
        # https certs & key file
        ;cert_file =
        ;cert_key =
    
        # Unix socket path
        ;socket =
    
        #################################### Database ####################################
        [database]
        # You can configure the database connection by specifying type, host, name, user and password
        # as seperate properties or as on string using the url propertie.
    
        # Either "mysql", "postgres" or "sqlite3", it's your choice
        ;type = sqlite3
        ;host = 127.0.0.1:3306
        ;name = grafana
        ;user = root
        # If the password contains # or ; you have to wrap it with triple quotes. Ex """#password;"""
        ;password =
    
        # Use either URL or the previous fields to configure the database
        # Example: mysql://user:secret@host:port/database
        ;url =
    
        # For "postgres" only, either "disable", "require" or "verify-full"
        ;ssl_mode = disable
    
        # For "sqlite3" only, path relative to data_path setting
        ;path = grafana.db
    
        # Max idle conn setting default is 2
        ;max_idle_conn = 2
    
        # Max conn setting default is 0 (mean not set)
        ;max_open_conn =
    
        # Connection Max Lifetime default is 14400 (means 14400 seconds or 4 hours)
        ;conn_max_lifetime = 14400
    
        # Set to true to log the sql calls and execution times.
        log_queries =
    
        #################################### Session ####################################
        [session]
        # Either "memory", "file", "redis", "mysql", "postgres", default is "file"
        ;provider = file
    
        # Provider config options
        # memory: not have any config yet
        # file: session dir path, is relative to grafana data_path
        # redis: config like redis server e.g. `addr=127.0.0.1:6379,pool_size=100,db=grafana`
        # mysql: go-sql-driver/mysql dsn config string, e.g. `user:password@tcp(127.0.0.1:3306)/database_name`
        # postgres: user=a password=b host=localhost port=5432 dbname=c sslmode=disable
        ;provider_config = sessions
    
        # Session cookie name
        ;cookie_name = grafana_sess
    
        # If you use session in https only, default is false
        ;cookie_secure = false
    
        # Session life time, default is 86400
        ;session_life_time = 86400
    
        #################################### Data proxy ###########################
        [dataproxy]
    
        # This enables data proxy logging, default is false
        ;logging = false
    
        #################################### Analytics ####################################
        [analytics]
        # Server reporting, sends usage counters to stats.grafana.org every 24 hours.
        # No ip addresses are being tracked, only simple counters to track
        # running instances, dashboard and error counts. It is very helpful to us.
        # Change this option to false to disable reporting.
        ;reporting_enabled = true
    
        # Set to false to disable all checks to https://grafana.net
        # for new vesions (grafana itself and plugins), check is used
        # in some UI views to notify that grafana or plugin update exists
        # This option does not cause any auto updates, nor send any information
        # only a GET request to http://grafana.com to get latest versions
        ;check_for_updates = true
    
        # Google Analytics universal tracking code, only enabled if you specify an id here
        ;google_analytics_ua_id =
    
        #################################### Security ####################################
        [security]
        # default admin user, created on startup
        ;admin_user = admin
    
        # default admin password, can be changed before first start of grafana,  or in profile settings
        ;admin_password = admin
    
        # used for signing
        ;secret_key = SW2YcwTIb9zpOOhoPsMm
    
        # Auto-login remember days
        ;login_remember_days = 7
        ;cookie_username = grafana_user
        ;cookie_remember_name = grafana_remember
    
        # disable gravatar profile images
        ;disable_gravatar = false
    
        # data source proxy whitelist (ip_or_domain:port separated by spaces)
        ;data_source_proxy_whitelist =
    
        # disable protection against brute force login attempts
        ;disable_brute_force_login_protection = false
    
        #################################### Snapshots ###########################
        [snapshots]
        # snapshot sharing options
        ;external_enabled = true
        ;external_snapshot_url = https://snapshots-origin.raintank.io
        ;external_snapshot_name = Publish to snapshot.raintank.io
    
        # remove expired snapshot
        ;snapshot_remove_expired = true
    
        #################################### Dashboards History ##################
        [dashboards]
        # Number dashboard versions to keep (per dashboard). Default: 20, Minimum: 1
        ;versions_to_keep = 20
    
        #################################### Users ###############################
        [users]
        # disable user signup / registration
        ;allow_sign_up = true
    
        # Allow non admin users to create organizations
        ;allow_org_create = true
    
        # Set to true to automatically assign new users to the default organization (id 1)
        ;auto_assign_org = true
    
        # Default role new users will be automatically assigned (if disabled above is set to true)
        ;auto_assign_org_role = Viewer
    
        # Background text for the user field on the login page
        ;login_hint = email or username
    
        # Default UI theme ("dark" or "light")
        ;default_theme = dark
    
        # External user management, these options affect the organization users view
        ;external_manage_link_url =
        ;external_manage_link_name =
        ;external_manage_info =
    
        # Viewers can edit/inspect dashboard settings in the browser. But not save the dashboard.
        ;viewers_can_edit = false
    
        [auth]
        # Set to true to disable (hide) the login form, useful if you use OAuth, defaults to false
        ;disable_login_form = false
    
        # Set to true to disable the signout link in the side menu. useful if you use auth.proxy, defaults to false
        ;disable_signout_menu = false
    
        #################################### Anonymous Auth ##########################
        [auth.anonymous]
        # enable anonymous access
        ;enabled = false
    
        # specify organization name that should be used for unauthenticated users
        ;org_name = Main Org.
    
        # specify role for unauthenticated users
        ;org_role = Viewer
    
        #################################### Github Auth ##########################
        [auth.github]
        ;enabled = false
        ;allow_sign_up = true
        ;client_id = some_id
        ;client_secret = some_secret
        ;scopes = user:email,read:org
        ;auth_url = https://github.com/login/oauth/authorize
        ;token_url = https://github.com/login/oauth/access_token
        ;api_url = https://api.github.com/user
        ;team_ids =
        ;allowed_organizations =
    
        #################################### Google Auth ##########################
        [auth.google]
        ;enabled = false
        ;allow_sign_up = true
        ;client_id = some_client_id
        ;client_secret = some_client_secret
        ;scopes = https://www.googleapis.com/auth/userinfo.profile https://www.googleapis.com/auth/userinfo.email
        ;auth_url = https://accounts.google.com/o/oauth2/auth
        ;token_url = https://accounts.google.com/o/oauth2/token
        ;api_url = https://www.googleapis.com/oauth2/v1/userinfo
        ;allowed_domains =
    
        #################################### Generic OAuth ##########################
        [auth.generic_oauth]
        ;enabled = false
        ;name = OAuth
        ;allow_sign_up = true
        ;client_id = some_id
        ;client_secret = some_secret
        ;scopes = user:email,read:org
        ;auth_url = https://foo.bar/login/oauth/authorize
        ;token_url = https://foo.bar/login/oauth/access_token
        ;api_url = https://foo.bar/user
        ;team_ids =
        ;allowed_organizations =
    
        #################################### Grafana.com Auth ####################
        [auth.grafana_com]
        ;enabled = false
        ;allow_sign_up = true
        ;client_id = some_id
        ;client_secret = some_secret
        ;scopes = user:email
        ;allowed_organizations =
    
        #################################### Auth Proxy ##########################
        [auth.proxy]
        ;enabled = false
        ;header_name = X-WEBAUTH-USER
        ;header_property = username
        ;auto_sign_up = true
        ;ldap_sync_ttl = 60
        ;whitelist = 192.168.1.1, 192.168.2.1
    
        #################################### Basic Auth ##########################
        [auth.basic]
        ;enabled = true
    
        #################################### Auth LDAP ##########################
        [auth.ldap]
        ;enabled = false
        ;config_file = /etc/grafana/ldap.toml
        ;allow_sign_up = true
    
        #################################### SMTP / Emailing ##########################
        [smtp]
        ;enabled = false
        ;host = localhost:25
        ;user =
        # If the password contains # or ; you have to wrap it with trippel quotes. Ex """#password;"""
        ;password =
        ;cert_file =
        ;key_file =
        ;skip_verify = false
        ;from_address = admin@grafana.localhost
        ;from_name = Grafana
        # EHLO identity in SMTP dialog (defaults to instance_name)
        ;ehlo_identity = dashboard.example.com
    
        [emails]
        ;welcome_email_on_sign_up = false
    
        #################################### Logging ##########################
        [log]
        # Either "console", "file", "syslog". Default is console and  file
        # Use space to separate multiple modes, e.g. "console file"
        ;mode = console file
    
        # Either "debug", "info", "warn", "error", "critical", default is "info"
        ;level = info
    
        # optional settings to set different levels for specific loggers. Ex filters = sqlstore:debug
        ;filters =
    
        # For "console" mode only
        [log.console]
        ;level =
    
        # log line format, valid options are text, console and json
        ;format = console
    
        # For "file" mode only
        [log.file]
        ;level =
    
        # log line format, valid options are text, console and json
        ;format = text
    
        # This enables automated log rotate(switch of following options), default is true
        ;log_rotate = true
    
        # Max line number of single file, default is 1000000
        ;max_lines = 1000000
    
        # Max size shift of single file, default is 28 means 1 << 28, 256MB
        ;max_size_shift = 28
    
        # Segment log daily, default is true
        ;daily_rotate = true
    
        # Expired days of log file(delete after max days), default is 7
        ;max_days = 7
    
        [log.syslog]
        ;level =
    
        # log line format, valid options are text, console and json
        ;format = text
    
        # Syslog network type and address. This can be udp, tcp, or unix. If left blank, the default unix endpoints will be used.
        ;network =
        ;address =
    
        # Syslog facility. user, daemon and local0 through local7 are valid.
        ;facility =
    
        # Syslog tag. By default, the process' argv[0] is used.
        ;tag =
    
        #################################### Alerting ############################
        [alerting]
        # Disable alerting engine & UI features
        ;enabled = true
        # Makes it possible to turn off alert rule execution but alerting UI is visible
        ;execute_alerts = true
    
        #################################### Internal Grafana Metrics ##########################
        # Metrics available at HTTP API Url /metrics
        [metrics]
        # Disable / Enable internal metrics
        ;enabled           = true
    
        # Publish interval
        ;interval_seconds  = 10
    
        # Send internal metrics to Graphite
        [metrics.graphite]
        # Enable by setting the address setting (ex localhost:2003)
        ;address =
        ;prefix = prod.grafana.%(instance_name)s.
    
        #################################### Distributed tracing ############
        [tracing.jaeger]
        # Enable by setting the address sending traces to jaeger (ex localhost:6831)
        ;address = localhost:6831
        # Tag that will always be included in when creating new spans. ex (tag1:value1,tag2:value2)
        ;always_included_tag = tag1:value1
        # Type specifies the type of the sampler: const, probabilistic, rateLimiting, or remote
        ;sampler_type = const
        # jaeger samplerconfig param
        # for "const" sampler, 0 or 1 for always false/true respectively
        # for "probabilistic" sampler, a probability between 0 and 1
        # for "rateLimiting" sampler, the number of spans per second
        # for "remote" sampler, param is the same as for "probabilistic"
        # and indicates the initial sampling rate before the actual one
        # is received from the mothership
        ;sampler_param = 1
    
        #################################### Grafana.com integration  ##########################
        # Url used to to import dashboards directly from Grafana.com
        [grafana_com]
        ;url = https://grafana.com
    
        #################################### External image storage ##########################
        [external_image_storage]
        # Used for uploading images to public servers so they can be included in slack/email messages.
        # you can choose between (s3, webdav, gcs, azure_blob, local)
        ;provider =
    
        [external_image_storage.s3]
        ;bucket =
        ;region =
        ;path =
        ;access_key =
        ;secret_key =
    
        [external_image_storage.webdav]
        ;url =
        ;public_url =
        ;username =
        ;password =
    
        [external_image_storage.gcs]
        ;key_file =
        ;bucket =
        ;path =
    
        [external_image_storage.azure_blob]
        ;account_name =
        ;account_key =
        ;container_name =
    
        [external_image_storage.local]
        # does not require any configuration
    
    kind: ConfigMap
    metadata:
      creationTimestamp: null
      name: grafana-etc
      namespace: monitoring
    
    
    vim grafana-deployment.yaml
    apiVersion: extensions/v1beta1
    kind: Deployment
    metadata:
      name: grafana-core
      namespace: monitoring
      labels:
        app: grafana
        component: core
    spec:
      replicas: 1
      template:
        metadata:
          labels:
            app: grafana
            component: core
        spec:
          containers:
          - image: grafana/grafana
            name: grafana-core
            imagePullPolicy: IfNotPresent
            # env:
            resources:
              # keep request = limit to keep this container in guaranteed class
              limits:
                cpu: 200m
                memory: 2048Mi
              requests:
                cpu: 200m
                memory: 2048Mi
            env:
              # The following env variables set up basic auth twith the default admin user and admin password.
              - name: GF_AUTH_BASIC_ENABLED
                value: "true"
              - name: GF_AUTH_ANONYMOUS_ENABLED
                value: "false"
              # - name: GF_AUTH_ANONYMOUS_ORG_ROLE
              #   value: Admin
              # does not really work, because of template variables in exported dashboards:
              # - name: GF_DASHBOARDS_JSON_ENABLED
              #   value: "true"
            readinessProbe:
              httpGet:
                path: /login
                port: 3000
              # initialDelaySeconds: 30
              # timeoutSeconds: 1
            volumeMounts:
            - name: grafana-etc-volume
              mountPath: /etc/grafana/
            - name: grafana-settings
              mountPath: /var/lib/grafana
          volumes:
            - name: grafana-etc-volume
              configMap:
                name: grafana-etc
            - name: grafana-settings
              persistentVolumeClaim:
                claimName: grafana-pvc
    
    
    vim grafana-service.yaml
    apiVersion: v1
    kind: Service
    metadata:
      name: grafana
      namespace: monitoring
      labels:
        app: grafana
        component: core
      annotations:
        prometheus.io/scrape: 'true'
    spec:
      type: NodePort
      ports:
        - port: 3000
          targetPort: 3000
          nodePort: 30902
          protocol: TCP
          name: webui
      selector:
        app: grafana
        component: core
    
    
    mkdir dashboards
    cd dashboards
    #下载dashboards模板
    https://github.com/qist/kubernetes-monitor/tree/master/prometheus/grafana/dashboards
    
    
    #将需要的模板放到kubernetes目录下
    kubectl create configmap "grafana-import-dashboards" --from-file=kubernetes/ --namespace=monitoring
    
    
    vim grafana-job.yaml
    apiVersion: batch/v1
    kind: Job
    metadata:
      name: grafana-import-dashboards
      namespace: monitoring
      labels:
        app: grafana
        component: import-dashboards
    spec:
      template:
        metadata:
          name: grafana-import-dashboards
          labels:
            app: grafana
            component: import-dashboards
          annotations:
            pod.beta.kubernetes.io/init-containers: '[
              {
                "name": "wait-for-endpoints",
                "image": "registry.cn-hangzhou.aliyuncs.com/nevermore/grafana-tiny-tools:v1",
                "imagePullPolicy": "IfNotPresent",
                "command": ["fish", "-c", "echo "waiting for endpoints..."; while true; set endpoints (curl -s --cacert /var/run/secrets/kubernetes.io/serviceaccount/ca.crt --header "Authorization: Bearer "(cat /var/run/secrets/kubernetes.io/serviceaccount/token) https://kubernetes.default.svc/api/v1/namespaces/monitoring/endpoints/grafana); echo $endpoints | jq "."; if test (echo $endpoints | jq -r ".subsets[]?.addresses // [] | length") -gt 0; exit 0; end; echo "waiting...";sleep 1; end"],
                "args": ["monitoring", "grafana"]
              }
            ]'
        spec:
          serviceAccountName: prometheus-k8s
          containers:
          - name: grafana-import-dashboards
            image: registry.cn-hangzhou.aliyuncs.com/nevermore/grafana-tiny-tools:v1
            command: ["/bin/sh", "-c"]
            workingDir: /opt/grafana-import-dashboards
            args:
              - >
                for file in *-datasource.json ; do
                  if [ -e "$file" ] ; then
                    echo "importing $file" &&
                    curl --silent --fail --show-error 
                      --request POST http://admin:admin@grafana:3000/api/datasources 
                      --header "Content-Type: application/json" 
                      --data-binary "@$file" ;
                    echo "" ;
                  fi
                done ;
                for file in *-dashboard.json ; do
                  if [ -e "$file" ] ; then
                    echo "importing $file" &&
                    ( echo '{"dashboard":'; 
                      cat "$file"; 
                      echo ',"overwrite":true,"inputs":[{"name":"DS_PROMETHEUS","type":"datasource","pluginId":"prometheus","value":"prometheus"}]}' ) 
                    | jq -c '.' 
                    | curl --silent --fail --show-error 
                      --request POST http://admin:admin@grafana:3000/api/dashboards/import 
                      --header "Content-Type: application/json" 
                      --data-binary "@-" ;
                    echo "" ;
                  fi
                done
            volumeMounts:
            - name: config-volume
              mountPath: /opt/grafana-import-dashboards
          restartPolicy: Never
          volumes:
          - name: config-volume
            configMap:
              name: grafana-import-dashboards
    
    
    #执行导入数据
    kubectl apply -f grafana-job.yaml
    
    
    kube-state-metrics 服务
    vim kube-state-metrics-rbac.yaml
    apiVersion: v1
    kind: ServiceAccount
    metadata:
      name: kube-state-metrics
      namespace: monitoring
    ---
    apiVersion: rbac.authorization.k8s.io/v1
    kind: ClusterRole
    metadata:
      name: kube-state-metrics
    rules:
    - apiGroups:
      - ""
      resources:
      - configmaps
      - secrets
      - nodes
      - pods
      - services
      - resourcequotas
      - replicationcontrollers
      - limitranges
      - persistentvolumeclaims
      - persistentvolumes
      - namespaces
      - endpoints
      verbs:
      - list
      - watch
    - apiGroups:
      - extensions
      resources:
      - daemonsets
      - deployments
      - replicasets
      - ingresses
      verbs:
      - list
      - watch
    - apiGroups:
      - apps
      resources:
      - statefulsets
      - daemonsets
      - deployments
      - replicasets
      verbs:
      - list
      - watch
    - apiGroups:
      - batch
      resources:
      - cronjobs
      - jobs
      verbs:
      - list
      - watch
    - apiGroups:
      - autoscaling
      resources:
      - horizontalpodautoscalers
      verbs:
      - list
      - watch
    - apiGroups:
      - authentication.k8s.io
      resources:
      - tokenreviews
      verbs:
      - create
    - apiGroups:
      - authorization.k8s.io
      resources:
      - subjectacce***eviews
      verbs:
      - create
    - apiGroups:
      - policy
      resources:
      - poddisruptionbudgets
      verbs:
      - list
      - watch
    - apiGroups: 
      - certificates.k8s.io
      resources:
      - certificatesigningrequests
      verbs: 
      - list
      - watch
    - apiGroups: 
      - storage.k8s.io
      resources:
      - storageclasses
      verbs: 
      - list
      - watch
    ---
    apiVersion: rbac.authorization.k8s.io/v1
    kind: ClusterRoleBinding
    metadata:
      name: kube-state-metrics
    roleRef:
      apiGroup: rbac.authorization.k8s.io
      kind: ClusterRole
      name: kube-state-metrics
    subjects:
    - kind: ServiceAccount
      name: kube-state-metrics
      namespace: monitoring
    ---
    apiVersion: rbac.authorization.k8s.io/v1
    kind: Role
    metadata:
      name: kube-state-metrics
      namespace: monitoring
    rules:
    - apiGroups:
      - ""
      resources:
      - pods
      verbs:
      - get
    - apiGroups:
      - extensions
      resourceNames:
      - kube-state-metrics
      resources:
      - deployments
      verbs:
      - get
      - update
    - apiGroups:
      - apps
      resourceNames:
      - kube-state-metrics
      resources:
      - deployments
      verbs:
      - get
      - update
    ---
    apiVersion: rbac.authorization.k8s.io/v1
    kind: RoleBinding
    metadata:
      name: kube-state-metrics
      namespace: monitoring
    roleRef:
      apiGroup: rbac.authorization.k8s.io
      kind: Role
      name: kube-state-metrics
    subjects:
    - kind: ServiceAccount
      name: kube-state-metrics
    
    
    vim kube-state-metrics-service.yaml
    apiVersion: v1
    kind: Service
    metadata:
      annotations:
        prometheus.io/scrape: 'true'
      name: kube-state-metrics
      namespace: monitoring
      labels:
        k8s-app: kube-state-metrics
    spec:
      ports:
      - name: http-main
        port: 8080
        protocol: TCP
      - name: http-self
        port: 8081
        protocol: TCP
      selector:
        app: kube-state-metrics
    
    
    vim kube-state-metrics-serviceMonitor.yaml
    apiVersion: monitoring.coreos.com/v1
    kind: ServiceMonitor
    metadata:
      labels:
        k8s-app: kube-state-metrics
      name: kube-state-metrics
      namespace: monitoring
    spec:
      endpoints:
      - honorLabels: true
        interval: 30s
        port: http-main
        scheme: http
        scrapeTimeout: 30s
      - interval: 30s
        port: http-self
        scheme: http
      jobLabel: k8s-app
      selector:
        matchLabels:
          k8s-app: kube-state-metrics
    
    
    vim kube-state-metrics-deployment.yaml
    apiVersion: v1
    kind: ConfigMap
    metadata:
      name: nanny-config
      namespace: default
    data:
      NannyConfiguration: |-
        apiVersion: nannyconfig/v1alpha1
        kind: NannyConfiguration
    ---
    apiVersion: apps/v1beta2
    kind: Deployment
    metadata:
      labels:
        app: kube-state-metrics
      name: kube-state-metrics
      namespace: monitoring
    spec:
      replicas: 1
      selector:
        matchLabels:
          app: kube-state-metrics
      template:
        metadata:
          labels:
            app: kube-state-metrics
        spec:
          serviceAccountName: kube-state-metrics
          containers:
          - name: kube-state-metrics
            image: googlecontainer/kube-state-metrics:v1.6.0
            ports:
            - name: http-metrics
              containerPort: 8080
            - name: telemetry
              containerPort: 8081
            readinessProbe:
              httpGet:
                path: /healthz
                port: 8080
              initialDelaySeconds: 10
              timeoutSeconds: 10
          - name: addon-resizer
            image: juestnow/addon-resizer:1.8.5
            resources:
              limits:
                cpu: 100m
                memory: 30Mi
              requests:
                cpu: 100m
                memory: 30Mi
            env:
              - name: MY_POD_NAME
                valueFrom:
                  fieldRef:
                    fieldPath: metadata.name
              - name: MY_POD_NAMESPACE
                valueFrom:
                  fieldRef:
                    fieldPath: metadata.namespace
            command:
              - /pod_nanny
              - --container=kube-state-metrics
              - --cpu=100m
              - --extra-cpu=1m
              - --memory=200Mi
              - --extra-memory=2Mi
              - --threshold=5
              - --deployment=kube-state-metrics
          nodeSelector:
            beta.kubernetes.io/os: linux
          serviceAccountName: kube-state-metrics
    
    
    #创建
    kubectl apply -f .
    

      

  • 相关阅读:
    动态规划之最大子段和问题
    hdu1203 I NEED A OFFER!---概率DP(01背包)
    hdu1087 Super Jumping! Jumping! Jumping!---基础DP---递增子序列最大和
    hdu2062 Subset sequence----递推
    java线程基础巩固---通过实验分析This锁和Class锁的存在
    java8学习之BiFunction函数式接口实例演示&Predicate函数式接口详解
    java8学习之Function与BiFunction函数式接口详解
    java8学习之Lambda表达式继续探讨&Function接口详解
    java8学习之Lambda表达式深入与流初步
    java8学习之深入函数式接口与方法引用
  • 原文地址:https://www.cnblogs.com/xieyi5420/p/13474215.html
Copyright © 2011-2022 走看看